<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Cancer</journal-id><journal-id journal-id-type="publisher-id">cancer</journal-id><journal-id journal-id-type="index">21</journal-id><journal-title>JMIR Cancer</journal-title><abbrev-journal-title>JMIR Cancer</abbrev-journal-title><issn pub-type="epub">2369-1999</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v11i1e64685</article-id><article-id pub-id-type="doi">10.2196/64685</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Predicting Pathological Complete Response Following Neoadjuvant Therapy in Patients With Breast Cancer: Development of Machine Learning&#x2013;Based Prediction Models in a Retrospective Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Lai</surname><given-names>Chun-Chi</given-names></name><degrees>MSc, MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Chen</surname><given-names>Cheng-Yu</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="aff" rid="aff6">6</xref><xref ref-type="aff" rid="aff7">7</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Chang</surname><given-names>Tzu-Hao</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff8">8</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib></contrib-group><aff id="aff1"><institution>Graduate Institute of Biomedical Informatics, College of Medical Science and Technology, Taipei Medical University</institution><addr-line>9th Floor, 301 Yuantong Road, Zhonghe District</addr-line><addr-line>Taipei</addr-line><country>Taiwan</country></aff><aff id="aff2"><institution>Division of General Surgery, Department of Surgery, New Taipei Municipal TuCheng Hospital</institution><addr-line>New Taipei City</addr-line><country>Taiwan</country></aff><aff id="aff3"><institution>Department of Medical Imaging, Taipei Medical University Hospital</institution><addr-line>Taipei</addr-line><country>Taiwan</country></aff><aff id="aff4"><institution>Department of Radiology, School of Medicine, College of Medicine, Taipei Medical University</institution><addr-line>Taipei</addr-line><country>Taiwan</country></aff><aff id="aff5"><institution>Research Center for Artificial Intelligence in Medicine, Taipei Medical University</institution><addr-line>Taipei</addr-line><country>Taiwan</country></aff><aff id="aff6"><institution>Department of Radiology, National Defense Medical Center</institution><addr-line>Taipei</addr-line><country>Taiwan</country></aff><aff id="aff7"><institution>Translational Imaging Research Center, Taipei Medical University Hospital</institution><addr-line>Taipei</addr-line><country>Taiwan</country></aff><aff id="aff8"><institution>Clinical Big Data Research Center, Taipei Medical University Hospital</institution><addr-line>Taipei</addr-line><country>Taiwan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Cahill</surname><given-names>Naomi</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Bracken-Clarke</surname><given-names>Dara</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Liu</surname><given-names>Yinhua</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Tzu-Hao Chang, PhD, Graduate Institute of Biomedical Informatics, College of Medical Science and Technology, Taipei Medical University, 9th Floor, 301 Yuantong Road, Zhonghe District, Taipei, Taiwan, 886 66202589 ext 10928; <email>kevinchang@tmu.edu.tw</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>18</day><month>7</month><year>2025</year></pub-date><volume>11</volume><elocation-id>e64685</elocation-id><history><date date-type="received"><day>23</day><month>07</month><year>2024</year></date><date date-type="rev-recd"><day>23</day><month>04</month><year>2025</year></date><date date-type="accepted"><day>24</day><month>04</month><year>2025</year></date></history><copyright-statement>&#x00A9; Chun-Chi Lai, Cheng-Yu Chen, Tzu-Hao Chang. Originally published in JMIR Cancer (<ext-link ext-link-type="uri" xlink:href="https://cancer.jmir.org">https://cancer.jmir.org</ext-link>), 18.7.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cancer, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://cancer.jmir.org/">https://cancer.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://cancer.jmir.org/2025/1/e64685"/><abstract><sec><title>Background</title><p>Breast cancer is the most prevalent form of cancer worldwide, with 2.3 million new diagnoses in 2022. Recent advancements in treatment have led to a shift in the use of chemotherapy-targeted immunotherapy from a postoperative adjuvant to a preoperative neoadjuvant approach in select cases, resulting in enhanced survival outcomes. A pathological complete response (pCR) is a critical prognostic marker, with higher pCR rates linked to improved overall and disease-free survival.</p></sec><sec><title>Objective</title><p>The objective of this study was to develop robust, machine learning&#x2013;based prediction models for pCR following neoadjuvant therapy, leveraging clinical, laboratory, and imaging data.</p></sec><sec sec-type="methods"><title>Methods</title><p>A retrospective cohort study was conducted using data from the Taipei Medical University Clinical Research Database from 2015 to 2022. Eligible patients were those with breast cancer who received neoadjuvant therapy followed by curative surgical resection. Machine learning models were developed using 3 distinct sets of variables. Model 1 included 14 clinical features such as age, height, weight, tumor stage, receptor status, tumor markers, and intrinsic subtype. Model 2 expanded on this by incorporating additional laboratory data and comorbidities (29 variables in total). Model 3 added breast sonography response data to the clinical variables in model 1. Algorithms including logistic regression, random forest, support vector machines, and extreme gradient boosting were used. Feature selection was performed using recursive feature elimination with cross-validation, and model performance was assessed using accuracy and area under the receiver operating characteristic curve (AUROC).</p></sec><sec sec-type="results"><title>Results</title><p>A total of 334 patients were analyzed, with 199 in the non-pCR group and 135 in the pCR group. The application of logistic regression with recursive feature elimination with cross-validation was found to demonstrate the optimal performance among the various algorithms that were evaluated in this study. Model 1 attained a mean accuracy of 0.66 (SD 0.02) and a mean AUROC of 0.73 (SD 0.01). The incorporation of laboratory data and comorbidities in model 2 did not yield significant enhancement, with a mean accuracy of 0.67 (SD 0.02) and a mean AUROC of 0.73 (SD 0.01). The incorporation of breast sonography response in model 3 led to a modest enhancement in predictive performance for the sonography group (accuracy 0.68; AUROC 0.60) in comparison to the nonsonography group (accuracy 0.66; AUROC 0.55). Despite the modest sample size (41 patients) of model 3, the integration of sonography data appeared to offer additional value in predicting pCR and warrants further investigation.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study suggests that incorporating breast sonography into models with clinical and laboratory data may modestly improve pCR prediction. It is important to note that the findings of this study are preliminary and require cautious interpretation. Further studies are required to validate this approach and support its integration into a machine learning&#x2013;based clinical workflow.</p></sec></abstract><kwd-group><kwd>breast cancer</kwd><kwd>neoadjuvant therapy</kwd><kwd>pathological complete response</kwd><kwd>breast sonography</kwd><kwd>machine learning</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Breast Cancer and Treatment Strategies</title><p>Breast cancer is the most prevalent cancer worldwide, with approximately 2.3 million women diagnosed and 670,000 deaths reported in 2022 [<xref ref-type="bibr" rid="ref1">1</xref>]. In Taiwan, the disease is also the most prevalent form of cancer among women, with an annual incidence of 15,000 new cases [<xref ref-type="bibr" rid="ref2">2</xref>]. Treatment strategies for breast cancer are highly personalized, encompassing surgery, chemotherapy, targeted therapy, immunotherapy, hormone therapy, and radiotherapy [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Historically, the sequence of chemotherapy, targeted therapy, and immunotherapy was implemented as an adjuvant treatment following surgery. However, in certain circumstances, it is now used as neoadjuvant therapy, administered prior to surgery, to optimize outcomes [<xref ref-type="bibr" rid="ref5">5</xref>].</p></sec><sec id="s1-2"><title>The Role and Advantages of Neoadjuvant Therapy</title><p>Neoadjuvant therapy confers a number of clinical advantages, including the potential to reduce the size of the tumor, thereby enabling breast-conserving surgery in patients who might otherwise require mastectomy. This approach also provides a critical window to monitor tumor regression and assess pathological responses, which are strongly correlated with improved overall survival and disease-free survival [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. It is imperative to acknowledge that the efficacy of neoadjuvant therapy exhibits substantial intrinsic subtype variability, underscoring the necessity for subtype-specific therapeutic strategies.</p><p>Current guidelines recommend neoadjuvant therapy for patients with &#x2265; cT2 or cN(+) luminal-type breast cancer and &#x2265; cT1c, cN0 human epidermal growth factor receptor 2 (HER2)-positive or triple-negative breast cancer (TNBC) [<xref ref-type="bibr" rid="ref9">9</xref>]. In the context of HER2-positive breast cancer, the Adjuvant Paclitaxel and Trastuzumab trial has demonstrated the efficacy of a de-escalated regimen of TH (paclitaxel and trastuzumab) for 12 cycles in achieving excellent outcomes for lower-risk patients [<xref ref-type="bibr" rid="ref10">10</xref>]. In the context of TNBC, the incorporation of carboplatin into standard neoadjuvant chemotherapy has been shown to result in a substantial enhancement in pathological complete response (pCR) rates [<xref ref-type="bibr" rid="ref11">11</xref>]. Moreover, the addition of pembrolizumab in conjunction with chemotherapy has been observed to further augment pCR rates and event-free survival, particularly in cases classified as high risk [<xref ref-type="bibr" rid="ref12">12</xref>].</p><p>An accurate assessment of tumor response is imperative for the optimization of neoadjuvant therapy strategies. Previous studies have investigated a multitude of factors to predict pCR in patients with breast cancer undergoing neoadjuvant therapy [<xref ref-type="bibr" rid="ref13">13</xref>]. Imaging modalities, such as breast sonography, are valuable for evaluating tumor size and margins, with a sensitivity of 61% and specificity of 78% [<xref ref-type="bibr" rid="ref14">14</xref>]. Breast sonography plays a pivotal role in assessing response during treatment and complementing clinical examination, which remains a reliable and accessible method for evaluating palpable lesions. This dual approach enables the timely identification of nonresponders, who can then be spared the adverse effects of ineffective chemotherapy and redirected to alternative therapeutic strategies with potentially greater efficacy [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>Despite the variability in pCR rates (10%&#x2010;60%) across different breast cancer intrinsic subtypes, accurate prediction of pCR using a combination of clinical features, imaging techniques, and pathology remains critical for tailoring treatment and improving outcomes [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>].</p></sec><sec id="s1-3"><title>Study Objective</title><p>The objective of this study is to develop a user-friendly prediction model for pCR after neoadjuvant therapy by integrating clinical features, advanced machine learning techniques, and breast sonography data. The implementation of such a model has the potential to facilitate the early identification of nonresponders, thereby enabling timely therapeutic adjustments and averting the administration of ineffective treatments. The ultimate implementation of this model in clinical practice could enhance personalized treatment plans, improve patient outcomes, and optimize health care resource use.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design and Data Source</title><p>This retrospective cohort study used data from the Taipei Medical University Clinical Research Database (TMU-CRD), an electronic medical record system established in 2015. The dataset used in this study was exclusively derived from the TMU-CRD, which consolidates data from 3 affiliated academic hospitals: Taipei Medical University Hospital, Wan Fang Hospital, and Shuang Ho Hospital. The database is managed and maintained by these academic centers, ensuring high data quality and reliability. The TMU-CRD encompasses both structured data, including patient demographics, International Classification of Diseases codes, laboratory results, treatment procedures, medication records, and cancer registry entries, as well as unstructured data, comprising physician notes, imaging reports, and pathological reports. As of 2024, the database encompasses data from 1998 to 2022 and contains the medical records of nearly 4.3 million patients across Taiwan.</p></sec><sec id="s2-2"><title>Patient Selection</title><p>The population of this study included patients diagnosed with breast cancer who underwent neoadjuvant therapy followed by curative-intent surgical resection. Patients were identified using a specific label in the cancer registry that indicated neoadjuvant treatment. Exclusion criteria encompassed instances where chemotherapy records were incomplete, where chemotherapy was not administered prior to surgery, and the presence of metastatic disease. Following the application of these criteria, a final cohort of 334 patients was identified for the purposes of analysis.</p></sec><sec id="s2-3"><title>Data Collection</title><p>A comprehensive dataset, encompassing clinical and imaging parameters, was meticulously collected to develop predictive models for pCR. The demographic variables included age, height, and weight, clinical tumor size, clinical TNM stage, hormone receptor (estrogen receptor [ER] or progesterone receptor [PR]) status, HER2 status, Ki-67 expression, breast cancer intrinsic subtype, Nottingham Bloom Richardson (NBR) grading, carcinoembryonic antigen (CEA) levels, carbohydrate antigen 15&#x2010;3 (CA15-3) levels, laboratory test results, and comorbidities. The intrinsic subtypes of breast cancer were categorized as hormone receptor-positive, HER2-positive, and triple-negative. The evaluation of imaging data, specifically breast sonography responses, was conducted based on Response Evaluation Criteria in Solid Tumors criteria and categorized into complete response, partial response, stable disease, or progression disease. The pathological response was classified as complete response (ypT0/Tis and ypN0) or residual disease.</p><p>The Allred scoring system was used to determine hormone receptor (ER or PR) status. The assessment of HER2 status was conducted through immunohistochemistry, and cases that yielded a score of 2+ underwent additional evaluation via fluorescence in situ hybridization. The TNM staging was determined according to the American Joint Committee on Cancer guidelines.</p></sec><sec id="s2-4"><title>Machine Learning Models</title><p>Three models were constructed for the development of machine learning models to predict pCR. Model 1 consisted of 14 clinical parameters, including age, height, weight, BMI, tumor size, clinical N stage, ER status, PR status, HER2 status, Ki-67 expression, NBR grading, CEA levels, CA15-3 levels, and breast cancer intrinsic subtype. Model 2 expanded upon model 1 by incorporating additional laboratory test results and comorbidities, resulting in a total of 29 variables. Model 3 included the parameters from model 1 and integrated breast sonography response data as an additional feature. Due to limited sonography data availability, this dataset included only 41 patients. Model 2 expanded upon model 1 by incorporating additional laboratory test results and comorbidities, resulting in a total of 29 variables.</p></sec><sec id="s2-5"><title>Statistical Analysis and Machine Learning Approach</title><p>Univariate analysis was performed using 2-tailed <italic>t</italic> tests and chi-square tests to identify significant differences between the pCR and non-pCR groups. Features that exhibited statistical significance (<italic>P</italic>&#x003C;.05) and those that were supported by existing literature were selected for model construction. Missing values were addressed through the implementation of imputation methods, with mean imputation being applied to continuous variables and an additional category being created for categorical variables. With regard to missing values, we excluded variables for which more than 30% of data points were missing.</p><p>The performance of the model was evaluated using accuracy and the area under the receiver operating characteristic curve (AUROC). The AUROC is a metric that quantifies a model&#x2019;s ability to distinguish between 2 classes (eg, pCR vs non-pCR) by plotting the true positive rate (sensitivity) against the false positive rate (1&#x2212;specificity) at various thresholds. An AUROC value of 1.0 indicates perfect classification, while a value of 0.5 represents no better performance than random chance. The College of American Pathologists asserts that an area under the curve below 0.6 indicates inadequate discriminative ability, values between 0.6 and 0.75 suggest beneficial discrimination, and values above 0.75 reflect substantial clinical utility. It is therefore generally recommended that an AUROC of at least 0.6 is attained for a prognostic model if its use in clinical settings for the prediction of cancer outcomes is to be considered beneficial [<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>The 3 models were analyzed using the following algorithms: logistic regression (LR), random forest, support vector machine, and extreme gradient boosting. The feature selection process was optimized through the implementation of recursive feature elimination with cross-validation. The training and testing datasets were partitioned into 80% and 20% of the total data, respectively, with the exception of model 3, where leave-one-out cross-validation (LOO-CV) was used due to the limited sample size. To interpret the importance of breast sonography in model 3, Shapley Additive Explanations (SHAP) were used. The SHAP values were computed using the SHAP Python package in order to quantify the contribution of each feature to the model&#x2019;s output. The mean absolute SHAP value was used to summarize feature importance, and the median rank of sonography response was calculated by comparing its importance across all features for each prediction. The performance of each model was evaluated using accuracy and AUROC metrics.</p></sec><sec id="s2-6"><title>Ethical Considerations</title><p>The study was reviewed and approved by the institutional review board (IRB) of Taipei Medical University, Taipei, Taiwan (IRB N202305036). The study entailed secondary analysis of deidentified data procured from the Taipei Medical University Clinical Research Database. In accordance with the regulations established by the IRB and the institutional policy, the requirement for informed consent was waived due to the fact that no personally identifiable information was accessed. The research was conducted in accordance with the ethical standards outlined in the Declaration of Helsinki. The participants did not receive any form of financial compensation, and no direct interaction occurred between the participants and the investigators. The maintenance of data privacy and confidentiality was strictly enforced throughout the study.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Basic Characteristics</title><p>We identified 334 patients from the 3 hospital datasets. These patients were stratified into 2 groups based on their pCR status: the non-pCR group, comprising 199 (59.5%) individuals, and the pCR group, comprising 135 (40.4%) individuals. Univariate analysis revealed significant differences between the 2 groups in several clinical parameters, including tumor size, clinical T stage, ER status, PR status, HER2 status, Ki-67 expression, breast cancer intrinsic subtype, CA15-3 levels, and hemoglobin concentrations. However, no significant differences were observed in age, BMI, clinical N stage, overall clinical stage, NBR grading, or CEA levels (<xref ref-type="table" rid="table1">Table 1</xref>).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Demographic data according to pCR<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> (N=334).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top" colspan="2"/><td align="left" valign="top">Non-pCR (n=199)</td><td align="left" valign="top">pCR (n=135)</td><td align="left" valign="top"><italic>P</italic> value<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">Age (years), mean (SD)</td><td align="char" char="." valign="top">53.6 (11.5)</td><td align="char" char="." valign="top">52.4 (10.5)</td><td align="char" char="." valign="top">.35</td></tr><tr><td align="left" valign="top" colspan="2">Height (cm), mean (SD)</td><td align="char" char="." valign="top">157.1 (5.6)</td><td align="char" char="." valign="top">157.1 (6.1)</td><td align="char" char="." valign="top">.93</td></tr><tr><td align="left" valign="top" colspan="2">Weight (kg), mean (SD)</td><td align="char" char="." valign="top">60.2 (10.7)</td><td align="char" char="." valign="top">60.1 (11.7)</td><td align="char" char="." valign="top">.90</td></tr><tr><td align="left" valign="top" colspan="2">BMI, mean (SD)</td><td align="char" char="." valign="top">24.4 (4.4)</td><td align="char" char="." valign="top">24.4 (4.8)</td><td align="char" char="." valign="top">.93</td></tr><tr><td align="left" valign="top" colspan="4">Clinical tumor size (mm)</td><td align="char" char="." valign="top">.01</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">47.9 (26.5)</td><td align="char" char="." valign="top">40.4 (22.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">4 (2)</td><td align="char" char="." valign="top">7 (5.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Clinical T stage, n (%)</td><td align="char" char="." valign="top">.01</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">T1</td><td align="char" char="." valign="top">16 (8)</td><td align="char" char="." valign="top">13 (9.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">T2</td><td align="char" char="." valign="top">100 (50.3)</td><td align="char" char="." valign="top">88 (65.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">T3</td><td align="char" char="." valign="top">53 (26.6)</td><td align="char" char="." valign="top">18 (13.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">T4</td><td align="char" char="." valign="top">30 (15.1)</td><td align="char" char="." valign="top">16 (11.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Clinical N stage, n (%)</td><td align="char" char="." valign="top">.29</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">N0</td><td align="char" char="." valign="top">42 (21.1)</td><td align="char" char="." valign="top">39 (28.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">N1</td><td align="char" char="." valign="top">126 (63.3)</td><td align="char" char="." valign="top">73 (54.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">N2</td><td align="char" char="." valign="top">22 (11.1)</td><td align="char" char="." valign="top">19 (14.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">N3</td><td align="char" char="." valign="top">9 (4.5)</td><td align="char" char="." valign="top">6 (4.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Stage, n (%)</td><td align="char" char="." valign="top">.15</td></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">1</td><td align="char" char="." valign="top">4 (2)</td><td align="char" char="." valign="top">4 (3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">2</td><td align="char" char="." valign="top">108 (54.3)</td><td align="char" char="." valign="top">86 (63.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">3</td><td align="char" char="." valign="top">87 (43.7)</td><td align="char" char="." valign="top">45 (33.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">ER<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup>, n (%)</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Positive</td><td align="char" char="." valign="top">134 (67.3)</td><td align="char" char="." valign="top">61 (45.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Negative</td><td align="char" char="." valign="top">65 (32.7)</td><td align="char" char="." valign="top">74 (54.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">PR<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup>, n (%)</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Positive</td><td align="char" char="." valign="top">117 (58.8)</td><td align="char" char="." valign="top">44 (32.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Negative</td><td align="char" char="." valign="top">82 (41.2)</td><td align="char" char="." valign="top">91 (67.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">HER2<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup>, n (%)</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Positive</td><td align="char" char="." valign="top">66 (33.2)</td><td align="char" char="." valign="top">89 (65.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Negative</td><td align="char" char="." valign="top">133 (66.8)</td><td align="char" char="." valign="top">46 (34.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Ki-67</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">39 (22.6)</td><td align="char" char="." valign="top">49.1 (22.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">18 (9)</td><td align="char" char="." valign="top">10 (7.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Subtype, n (%)</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">HR<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup> (+)</td><td align="char" char="." valign="top">100 (50.3)</td><td align="char" char="." valign="top">21 (15.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">HER2 (+)</td><td align="char" char="." valign="top">66 (33.2)</td><td align="char" char="." valign="top">89 (65.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">TNBC<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="char" char="." valign="top">33 (16.6)</td><td align="char" char="." valign="top">25 (18.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">NBR<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup>, n (%)</td><td align="char" char="." valign="top">.25</td></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">0</td><td align="char" char="." valign="top">4 (2)</td><td align="char" char="." valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">1</td><td align="char" char="." valign="top">79 (39.7)</td><td align="char" char="." valign="top">56 (41.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="char" char="." valign="top">2</td><td align="char" char="." valign="top">40 (20.1)</td><td align="char" char="." valign="top">26 (19.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing</td><td align="char" char="." valign="top">76 (38.1)</td><td align="char" char="." valign="top">53 (39.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">CEA<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></td><td align="char" char="." valign="top">.12</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">10.7 (44.6)</td><td align="char" char="." valign="top">4.2 (7.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">29 (14.5)</td><td align="char" char="." valign="top">16 (11.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">CA15-3<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup></td><td align="char" char="." valign="top">.04</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">21.3 (37.8)</td><td align="char" char="." valign="top">14 (9.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">32 (16)</td><td align="char" char="." valign="top">18 (13.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">WBC<sup><xref ref-type="table-fn" rid="table1fn11">k</xref></sup></td><td align="char" char="." valign="top">.34</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">7.12 (2.0)</td><td align="char" char="." valign="top">7.34 (2.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">36 (18.1)</td><td align="char" char="." valign="top">16 (11.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Hemoglobin</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">12.7 (1.7)</td><td align="char" char="." valign="top">13.2 (1.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">35 (17.6)</td><td align="char" char="." valign="top">16 (11.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Platelet</td><td align="char" char="." valign="top">.93</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">268.4 (77.2)</td><td align="char" char="." valign="top">269.2 (62.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">38 (19.1)</td><td align="char" char="." valign="top">16 (11.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Lymphocyte</td><td align="char" char="." valign="top">.99</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">27.0 (7.7)</td><td align="char" char="." valign="top">27.0 (9.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">55 (27.6)</td><td align="char" char="." valign="top">22 (16.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Neutrophil</td><td align="char" char="." valign="top">.80</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">63.3 (8.6)</td><td align="char" char="." valign="top">63.6 (10.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">55 (27.6)</td><td align="char" char="." valign="top">22 (16.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">BUN<sup><xref ref-type="table-fn" rid="table1fn12">l</xref></sup></td><td align="char" char="." valign="top">.92</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">12.7 (5.4)</td><td align="char" char="." valign="top">12.8 (4.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">26 (13.1)</td><td align="char" char="." valign="top">18 (13.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Creatinine</td><td align="char" char="." valign="top">.51</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">0.72 (0.5)</td><td align="char" char="." valign="top">0.68 (0.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">19 (9.5)</td><td align="char" char="." valign="top">14 (10.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">GOT<sup><xref ref-type="table-fn" rid="table1fn13">m</xref></sup></td><td align="char" char="." valign="top">.89</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">22.4 (11.4)</td><td align="char" char="." valign="top">22.6 (11.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">40 (20.1)</td><td align="char" char="." valign="top">19 (14.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">GPT<sup><xref ref-type="table-fn" rid="table1fn14">n</xref></sup></td><td align="char" char="." valign="top">.59</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mean (SD)</td><td align="char" char="." valign="top">21.6 (19.1)</td><td align="char" char="." valign="top">22.8 (21.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing, n (%)</td><td align="char" char="." valign="top">32 (16.1)</td><td align="char" char="." valign="top">14 (10.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Diabetes, n (%)</td><td align="char" char="." valign="top">.89</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Yes</td><td align="char" char="." valign="top">10 (5)</td><td align="char" char="." valign="top">7 (5.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">No</td><td align="char" char="." valign="top">170 (85.4)</td><td align="char" char="." valign="top">127 (94.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing</td><td align="char" char="." valign="top">19 (9.5)</td><td align="char" char="." valign="top">1 (0.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Hypertension, n (%)</td><td align="char" char="." valign="top">.19</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Yes</td><td align="char" char="." valign="top">23 (11.6)</td><td align="char" char="." valign="top">11 (8.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">No</td><td align="char" char="." valign="top">157 (78.9)</td><td align="char" char="." valign="top">123 (91.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing</td><td align="char" char="." valign="top">19 (9.5)</td><td align="char" char="." valign="top">1 (0.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Heart disease, n (%)</td><td align="char" char="." valign="top">.83</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Yes</td><td align="char" char="." valign="top">1 (0.5)</td><td align="char" char="." valign="top">1 (0.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">No</td><td align="char" char="." valign="top">179 (99)</td><td align="char" char="." valign="top">133 (98.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing</td><td align="char" char="." valign="top">1 (0.5)</td><td align="char" char="." valign="top">1 (0.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Kidney disease, n (%)</td><td align="char" char="." valign="top">.08</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Yes</td><td align="char" char="." valign="top">4 (2)</td><td align="char" char="." valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">No</td><td align="char" char="." valign="top">176 (88.4)</td><td align="char" char="." valign="top">134 (99.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing</td><td align="char" char="." valign="top">19 (9.5)</td><td align="char" char="." valign="top">1 (0.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Asthma, n (%)</td><td align="char" char="." valign="top">.83</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Yes</td><td align="char" char="." valign="top">1 (0.5)</td><td align="char" char="." valign="top">1 (0.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">No</td><td align="char" char="." valign="top">179 (89.9)</td><td align="char" char="." valign="top">133 (98.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing</td><td align="char" char="." valign="top">19 (9.5)</td><td align="char" char="." valign="top">1 (0.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Hepatitis B, n (%)</td><td align="char" char="." valign="top">.91</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Yes</td><td align="char" char="." valign="top">5 (2.5)</td><td align="char" char="." valign="top">4 (3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">No</td><td align="char" char="." valign="top">175 (88)</td><td align="char" char="." valign="top">130 (96.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing</td><td align="char" char="." valign="top">19 (9.5)</td><td align="char" char="." valign="top">1 (0.7)</td><td align="left" valign="top"/></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>pCR: pathological complete response.</p></fn><fn id="table1fn2"><p><sup>b</sup><italic>P</italic> values are based on univariate analysis results using 2-tailed <italic>t</italic> tests and chi-square tests.</p></fn><fn id="table1fn3"><p><sup>c</sup>ER: estrogen receptor.</p></fn><fn id="table1fn4"><p><sup>d</sup>PR: progesterone receptor.</p></fn><fn id="table1fn5"><p><sup>e</sup>HER2: human epidermal growth factor receptor 2.</p></fn><fn id="table1fn6"><p><sup>f</sup>HR: hormone receptor.</p></fn><fn id="table1fn7"><p><sup>g</sup>TNBC: triple-negative breast cancer.</p></fn><fn id="table1fn8"><p><sup>h</sup>NBR: Nottingham Bloom Richardson.</p></fn><fn id="table1fn9"><p><sup>i</sup>CEA: carcinoembryonic antigen.</p></fn><fn id="table1fn10"><p><sup>j</sup>CA15-3: carbohydrate antigen 15-3.</p></fn><fn id="table1fn11"><p><sup>k</sup>WBC: white blood cell.</p></fn><fn id="table1fn12"><p><sup>l</sup>BUN: blood urea nitrogen.</p></fn><fn id="table1fn13"><p><sup>m</sup>GOT: glutamic oxaloacetic transaminase.</p></fn><fn id="table1fn14"><p><sup>n</sup>GPT: glutamic pyruvic transaminase.</p></fn></table-wrap-foot></table-wrap><p>Although breast sonography response did not achieve statistical significance in univariate analysis, a trend toward a higher pCR rate was observed in patients demonstrating superior sonography response (<xref ref-type="table" rid="table2">Table 2</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Breast sonography responses with complete response and partial response are more likely to predict a pathological complete response (pCR) in final pathological result.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Sonography response</td><td align="left" valign="top">Non-pCR (n=28), n (%)</td><td align="left" valign="top">pCR (n=13), n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Complete response</td><td align="char" char="." valign="top">2 (7.1)</td><td align="char" char="." valign="top">3 (23.1)</td></tr><tr><td align="left" valign="top">Partial response</td><td align="char" char="." valign="top">13 (46.4)</td><td align="char" char="." valign="top">8 (61.5)</td></tr><tr><td align="left" valign="top">Stable disease</td><td align="char" char="." valign="top">12 (42.9)</td><td align="char" char="." valign="top">2 (15.4)</td></tr><tr><td align="left" valign="top">Progression disease</td><td align="char" char="." valign="top">1 (3.6)</td><td align="char" char="." valign="top">0 (0)</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>Machine Learning Features and Algorithms</title><p>The model 1 was analyzed using 6 machine learning algorithms, with LR incorporating recursive feature elimination and cross-validation demonstrating the best performance, yielding a mean accuracy of 0.66 (SD 0.02) and a mean AUROC of 0.73 (SD 0.01; <xref ref-type="table" rid="table3">Table 3</xref>).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Performance of the predication model for models 1 and 2.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Algorithm</td><td align="left" valign="bottom">Accuracy, mean (SD)</td><td align="left" valign="bottom">AUROC<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup>, mean (SD)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3">Model 1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>RF<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="char" char="." valign="top">0.60 (0.02)</td><td align="char" char="." valign="top">0.62 (0.04)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LR<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="char" char="." valign="top">0.66 (0.01)</td><td align="char" char="." valign="top">0.72 (0.02)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SVM<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="char" char="." valign="top">0.60 (0.02)</td><td align="char" char="." valign="top">0.64 (0.04)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>XGB<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="char" char="." valign="top">0.63 (0.02)</td><td align="char" char="." valign="top">0.67 (0.03)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LR with RFECV<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="char" char="." valign="top"><italic>0.66 (0.02)<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></italic></td><td align="char" char="." valign="top"><italic>0.73 (0.01)</italic></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>XGB with RFECV</td><td align="char" char="." valign="top">0.65 (0.02)</td><td align="char" char="." valign="top">0.70 (0.01)</td></tr><tr><td align="left" valign="top" colspan="3">Model 2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>RF</td><td align="char" char="." valign="top">0.61 (0.02)</td><td align="char" char="." valign="top">0.64 (0.03)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LR</td><td align="char" char="." valign="top">0.66 (0.02)</td><td align="char" char="." valign="top">0.72 (0.02)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SVM</td><td align="char" char="." valign="top">0.59 (0.01)</td><td align="char" char="." valign="top">0.59 (0.05)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>XGB</td><td align="char" char="." valign="top">0.64 (0.01)</td><td align="char" char="." valign="top">0.68 (0.02)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LR with RFECV</td><td align="char" char="." valign="top"><italic>0.67 (0.01)</italic></td><td align="char" char="." valign="top"><italic>0.73 (0.01)</italic></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>XGB with RFECV</td><td align="char" char="." valign="top">0.66 (0.03)</td><td align="char" char="." valign="top">0.72 (0.01)</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p></fn><fn id="table3fn2"><p><sup>b</sup>RF: random forest.</p></fn><fn id="table3fn3"><p><sup>c</sup>LR: logistic regression.</p></fn><fn id="table3fn4"><p><sup>d</sup>SVM: support vector machine.</p></fn><fn id="table3fn5"><p><sup>e</sup>XGB: extreme gradient boosting.</p></fn><fn id="table3fn6"><p><sup>f</sup>RFECV: recursive feature elimination with cross-validation.</p></fn><fn id="table3fn7"><p><sup>g</sup>The values in italics format indicate that LR with RFECV demonstrated the best performance among all evaluated algorithms.</p></fn></table-wrap-foot></table-wrap><p>In model 2, additional variables, including laboratory test results and comorbidities, were integrated with the clinical parameters from model 1, resulting in a total of 29 variables. However, the inclusion of these additional variables did not significantly improve predictive performance, with a mean accuracy of 0.67 (SD 0.02) and a mean AUROC of 0.73 (SD 0.01; <xref ref-type="table" rid="table3">Table 3</xref>).</p><p>In model 3, the incorporation of breast sonography response data into the variables from the first model resulted in a dataset comprising 15 variables. Due to the limited sample size, the analysis used the LR algorithm with LOO-CV. The findings demonstrated that the incorporation of sonography response enhanced the predictive accuracy of the model, with an accuracy of 0.68 and an AUROC of 0.60 for the sonography group, as opposed to an accuracy of 0.66 and an AUROC of 0.55 for the nonsonography group. Furthermore, a SHAP value for sonography response was 0.62 (<xref ref-type="fig" rid="figure1">Figure 1</xref>), and the median rank of sonography response was 5 (IQR 3-7) among all samples in model 3 (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>SHAP value for (A) without or (B) with breast sonography. CA15-3: carbohydrate antigen 15&#x2010;3; CEA: carcinoembryonic antigen; ER: estrogen receptor; HER2: human epidermal growth factor receptor 2; NBR: Nottingham Bloom Richardson; PR: progesterone receptor; SHAP: Shapley Additive Explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cancer_v11i1e64685_fig01.png"/></fig><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Boxplot illustrating the ranking of sonography response across all samples in model 3. The median rank of sonography response was 5 (IQR 3-7).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cancer_v11i1e64685_fig02.png"/></fig><p>Subsequent analysis of specific samples in model 3 was undertaken to investigate the value of sonography response (<xref ref-type="fig" rid="figure3">Figure 3</xref>). In sample 14, the predicted and true results were non-pCR; however, most variables predicted pCR, with only the sonography response correctly indicating non-pCR, aligning with the final result. A similar pattern was observed in samples 12, 26, and 27, where the predicted results were incongruent with the true outcomes; nevertheless, the sonography response accurately reflected the actual results.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Selected samples from model 3 highlighting the significance of sonography response in prediction accuracy. In sample 14, the true and predicted results were non-pCR, but most variables incorrectly predicted pCR&#x2014;except for the sonography response, which correctly indicated non-pCR. Similarly, in samples 12, 26, and 27, the predicted results were opposite to the actual outcomes; yet, the sonography response correctly aligned with the true results. CA15-3: carbohydrate antigen 15&#x2010;3; CEA: carcinoembryonic antigen; ER: estrogen receptor; HER2: human epidermal growth factor receptor 2; NBR: Nottingham Bloom Richardson; pCR: pathological complete response; PR: progesterone receptor; SHAP: Shapley Additive Explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cancer_v11i1e64685_fig03.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>The objective of this study was to develop machine learning&#x2013;based models to predict pCR in patients with breast cancer receiving neoadjuvant therapy, using clinical, laboratory, and imaging data. Three models were subjected to a rigorous testing process, and their predictive performance was thoroughly evaluated.</p><sec id="s4-1"><title>Principal Findings</title><p>Model 1 incorporated clinical parameters alone, yielding an AUROC of 0.73. Model 2, which added laboratory data and comorbidities, demonstrated no significant improvement over model 1. Model 3, which incorporated a further integration of breast sonography response, demonstrated a modest enhancement in its predictive performance. This enhancement was characterized by an increase in AUROC from 0.55 to 0.60 and an increase in accuracy from 0.66 to 0.68. Furthermore, SHAP analysis indicated that sonography response contributed significantly to the model, ranking fifth among all the features considered. In some cases, sonography response aligned with true outcomes, despite the failure of other variables to do so. These findings indicate the potential value of incorporating imaging data into prediction models to enhance individualized treatment strategies.</p></sec><sec id="s4-2"><title>Comparison to Prior Work</title><p>The predictive performance of model 1 is consistent with that reported in previous studies, which used clinical parameters alone and reported AUROCs ranging from 0.65 to 0.77 [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. The limited incremental value observed in model 2 is consistent with the findings in the literature that laboratory and comorbidity variables may not independently enhance prediction unless integrated with molecular or genetic data [<xref ref-type="bibr" rid="ref21">21</xref>]. This study&#x2019;s finding that breast sonography provides added predictive value is consistent with previous evidence highlighting the clinical utility of imaging in assessing tumor response, as demonstrated in model 3.</p><p>The observed pCR rates for the different intrinsic subtypes (HER2-positive, TNBC, and hormone receptor&#x2013;positive) also reflect established trends in neoadjuvant therapy responsiveness [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref25">25</xref>].</p></sec><sec id="s4-3"><title>Challenges With Small Sample Size and Machine Learning Approaches</title><p>Despite extensive data mining, only 41 cases with sonography response data were available for model 3, thereby limiting the sample size and potentially increasing the risk of overfitting. To address this issue, we used an LR model with LOO-CV, a method that has been demonstrated to be particularly effective when dealing with small datasets. Initially, algorithms such as support vector machines (and decision trees were considered; however, imbalances in the dataset led to classification bias, which resulted in the adoption of more straightforward LR models. It is recommended that future research endeavors place a priority on the acquisition of more substantial datasets with a view to enhancing the model&#x2019;s robustness and mitigating the risk of overfitting [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>].</p></sec><sec id="s4-4"><title>Clinical Implications</title><p>The predictive models developed in this study have practical applications in clinical decision-making. Specifically, model 1, which uses only baseline clinical data, facilitates initial treatment planning by predicting the likelihood of pCR subsequent to a decision to proceed with neoadjuvant therapy. The third model, which incorporates midtreatment sonography response, enables dynamic reassessment of pCR probability, facilitating timely adjustments to therapeutic strategies, such as switching to alternative treatments or surgical interventions. The integration of machine learning into standard clinical workflows may offer potential benefits for improving outcomes in breast cancer care (<xref ref-type="fig" rid="figure4">Figure 4</xref>). Given the small sample and lack of validation, the prediction model has not reached clinical maturity, and it is therefore not prudent to make recommendations regarding its application.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Conceptual flowchart outlining a potential application of the prediction model to support clinical decision-making. This framework is intended for illustrative purposes only and does not represent a validated clinical tool. pCR: pathological complete response.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cancer_v11i1e64685_fig04.png"/></fig></sec><sec id="s4-5"><title>Strengths and Limitations</title><p>A significant strength of this study is its multimodal approach, integrating clinical, laboratory, and imaging data within machine learning models. The use of SHAP values enhances interpretability and facilitates the identification of relevant predictors, including sonography response.</p><p>However, it is important to note several limitations of this study. First, the sample size for model 3 was limited (n=41), thereby restricting statistical power and increasing the risk of overfitting. To mitigate this issue, the LOO-CV and LR methods were applied. Second, the data extracted from semistructured reports may have been subject to inconsistencies. Despite the evident benefits of text mining in enhancing the quality of the results, the use of standardized data collection methods in future studies would be a preferred approach. Third, the models did not include genetic or molecular biomarkers, which may limit their predictive performance. Fourth, as a retrospective, single-center study, there is a risk of selection bias and limited generalizability. Variables with over 30% missing data were excluded, a process that potentially resulted in the omission of important predictors. Furthermore, the absence of external validation of the model is a notable shortcoming.</p></sec><sec id="s4-6"><title>Future Directions</title><p>Future research endeavors should explore the integration of genomic, molecular, and radiomic data to further refine prediction models. Conducting prospective, multi-institutional studies with larger and more diverse patient cohorts is imperative to validate findings and support generalizability. Standardizing imaging report formats and leveraging natural language processing tools may also enhance data quality for imaging-based predictors. Consequently, these advancements have the potential to facilitate the development of robust clinical decision-support tools, thereby optimizing neoadjuvant treatment planning in breast cancer care.</p></sec><sec id="s4-7"><title>Conclusions</title><p>This study provides preliminary insight into the potential role of breast sonography response data in improving pCR prediction for patients with breast cancer receiving neoadjuvant therapy. The clinical and laboratory parameters that were provided served as a useful foundation for the models, and the addition of imaging data appeared to offer modest improvements in predictive accuracy. However, given the relatively small sample size, these findings should be interpreted with caution. The incorporation of imaging data into clinical workflows could potentially represent a valuable step toward the development of more personalized treatment approaches.</p></sec></sec></body><back><ack><p>The authors would like to acknowledge the support of the Health Data Analytics and Statistics Center, Office of Data Science, Taipei Medical University, Taiwan, for their technical assistance. This study was supported by the National Science and Technology Council, Taiwan (project NSTC113-2321-B-038-012). The authors state that no generative artificial intelligence was used in the composition of this manuscript.</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated and analyzed during this study are not publicly available due to institutional review board regulations at Taipei Medical University. The data are available from the Taipei Medical University Clinical Research Database for researchers who meet the criteria for access to confidential data. Requests for access can be directed to the corresponding author and will be subject to approval by Taipei Medical University.</p></sec></notes><fn-group><fn fn-type="con"><p>CCL was the primary contributor to data analysis and manuscript writing. CYC was responsible for image processing and contributed to data extraction and preprocessing. THC spearheaded the study direction.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb2">CA15-3</term><def><p>carbohydrate antigen 15&#x2010;3</p></def></def-item><def-item><term id="abb3">CEA</term><def><p>carcinoembryonic antigen</p></def></def-item><def-item><term id="abb4">ER</term><def><p>estrogen receptor</p></def></def-item><def-item><term id="abb5">HER2</term><def><p>human epidermal growth factor receptor 2</p></def></def-item><def-item><term id="abb6">IRB</term><def><p>institutional review board</p></def></def-item><def-item><term id="abb7">LOO-CV</term><def><p>leave-one-out cross-validation</p></def></def-item><def-item><term id="abb8">LR</term><def><p>logistic regression</p></def></def-item><def-item><term id="abb9">NBR</term><def><p>Nottingham Bloom Richardson</p></def></def-item><def-item><term id="abb10">pCR</term><def><p>pathological complete response</p></def></def-item><def-item><term id="abb11">PR</term><def><p>progesterone receptor</p></def></def-item><def-item><term id="abb12">SHAP</term><def><p>Shapley Additive Explanations</p></def></def-item><def-item><term id="abb13">TMU-CRD</term><def><p>Taipei Medical University Clinical Research Database</p></def></def-item><def-item><term id="abb14">TNBC</term><def><p>triple-negative breast cancer</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bray</surname><given-names>F</given-names> </name><name name-style="western"><surname>Laversanne</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sung</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Global cancer statistics 2022: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title><source>CA Cancer J Clin</source><year>2024</year><volume>74</volume><issue>3</issue><fpage>229</fpage><lpage>263</lpage><pub-id pub-id-type="doi">10.3322/caac.21834</pub-id><pub-id pub-id-type="medline">38572751</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="report"><article-title>Taiwan Cancer Registry Annual Report 2022</article-title><year>2024</year><access-date>2025-06-17</access-date><publisher-name>Health Promotion Administration, Ministry of Health and Welfare</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.hpa.gov.tw/Pages/List.aspx?nodeid=119">https://www.hpa.gov.tw/Pages/List.aspx?nodeid=119</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nounou</surname><given-names>MI</given-names> </name><name name-style="western"><surname>ElAmrawy</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ahmed</surname><given-names>N</given-names> </name><name name-style="western"><surname>Abdelraouf</surname><given-names>K</given-names> </name><name name-style="western"><surname>Goda</surname><given-names>S</given-names> </name><name name-style="western"><surname>Syed-Sha-Qhattal</surname><given-names>H</given-names> </name></person-group><article-title>Breast cancer: conventional diagnosis and treatment modalities and recent patents and technologies</article-title><source>Breast Cancer (Auckl)</source><year>2015</year><volume>9</volume><issue>Suppl 2</issue><fpage>17</fpage><lpage>34</lpage><pub-id pub-id-type="doi">10.4137/BCBCR.S29420</pub-id><pub-id pub-id-type="medline">26462242</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cuniolo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Gipponi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Murelli</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Multidisciplinary and tailored treatment of locally advanced breast cancer in progression during neoadjuvant chemotherapy: case report</article-title><source>Curr Oncol</source><year>2024</year><month>05</month><day>16</day><volume>31</volume><issue>5</issue><fpage>2856</fpage><lpage>2866</lpage><pub-id pub-id-type="doi">10.3390/curroncol31050217</pub-id><pub-id pub-id-type="medline">38785498</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Korde</surname><given-names>LA</given-names> </name><name name-style="western"><surname>Somerfield</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Carey</surname><given-names>LA</given-names> </name><etal/></person-group><article-title>Neoadjuvant chemotherapy, endocrine therapy, and targeted therapy for breast cancer: ASCO guideline</article-title><source>J Clin Oncol</source><year>2021</year><month>05</month><day>1</day><volume>39</volume><issue>13</issue><fpage>1485</fpage><lpage>1505</lpage><pub-id pub-id-type="doi">10.1200/JCO.20.03399</pub-id><pub-id pub-id-type="medline">33507815</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cortazar</surname><given-names>P</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Untch</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Pathological complete response and long-term clinical benefit in breast cancer: the CTNeoBC pooled analysis</article-title><source>Lancet</source><year>2014</year><month>07</month><day>12</day><volume>384</volume><issue>9938</issue><fpage>164</fpage><lpage>172</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(13)62422-8</pub-id><pub-id pub-id-type="medline">24529560</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>M</given-names> </name><name name-style="western"><surname>O&#x2019;Shaughnessy</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Evaluation of pathologic complete response as a surrogate for long-term survival outcomes in triple-negative breast cancer</article-title><source>J Natl Compr Canc Netw</source><year>2020</year><month>08</month><volume>18</volume><issue>8</issue><fpage>1096</fpage><lpage>1104</lpage><pub-id pub-id-type="doi">10.6004/jnccn.2020.7550</pub-id><pub-id pub-id-type="medline">32755985</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Swain</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Macharia</surname><given-names>H</given-names> </name><name name-style="western"><surname>Cortes</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Event-free survival in patients with early HER2-positive breast cancer with a pathological complete response after HER2-targeted therapy: a pooled analysis</article-title><source>Cancers (Basel)</source><year>2022</year><month>10</month><day>15</day><volume>14</volume><issue>20</issue><fpage>5051</fpage><pub-id pub-id-type="doi">10.3390/cancers14205051</pub-id><pub-id pub-id-type="medline">36291835</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="web"><article-title>NCCN clinical practice guidelines in oncology: breast cancer. Version 5.2023</article-title><source>National Comprehensive Cancer Network</source><year>2023</year><access-date>2025-06-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nccn.org/professionals/physician_gls/pdf/breast.pdf">https://www.nccn.org/professionals/physician_gls/pdf/breast.pdf</ext-link></comment></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tolaney</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Barry</surname><given-names>WT</given-names> </name><name name-style="western"><surname>Dang</surname><given-names>CT</given-names> </name><etal/></person-group><article-title>Adjuvant paclitaxel and trastuzumab for node-negative, HER2-positive breast cancer</article-title><source>N Engl J Med</source><year>2015</year><month>01</month><day>8</day><volume>372</volume><issue>2</issue><fpage>134</fpage><lpage>141</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1406281</pub-id><pub-id pub-id-type="medline">25564897</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sikov</surname><given-names>WM</given-names> </name><name name-style="western"><surname>Berry</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Perou</surname><given-names>CM</given-names> </name><etal/></person-group><article-title>Impact of the addition of carboplatin and/or bevacizumab to neoadjuvant once-per-week paclitaxel followed by dose-dense doxorubicin and cyclophosphamide on pathologic complete response rates in stage II to III triple-negative breast cancer: CALGB 40603 (Alliance)</article-title><source>J Clin Oncol</source><year>2015</year><month>01</month><day>1</day><volume>33</volume><issue>1</issue><fpage>13</fpage><lpage>21</lpage><pub-id pub-id-type="doi">10.1200/JCO.2014.57.0572</pub-id><pub-id pub-id-type="medline">25092775</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schmid</surname><given-names>P</given-names> </name><name name-style="western"><surname>Cortes</surname><given-names>J</given-names> </name><name name-style="western"><surname>Pusztai</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Pembrolizumab for early triple-negative breast cancer</article-title><source>N Engl J Med</source><year>2020</year><month>02</month><day>27</day><volume>382</volume><issue>9</issue><fpage>810</fpage><lpage>821</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1910549</pub-id><pub-id pub-id-type="medline">32101663</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sammut</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Crispin-Ortuzar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Chin</surname><given-names>SF</given-names> </name><etal/></person-group><article-title>Multi-omic machine learning predictor of breast cancer therapy response</article-title><source>Nature New Biol</source><year>2022</year><month>01</month><volume>601</volume><issue>7894</issue><fpage>623</fpage><lpage>629</lpage><pub-id pub-id-type="doi">10.1038/s41586-021-04278-5</pub-id><pub-id pub-id-type="medline">34875674</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Romeo</surname><given-names>V</given-names> </name><name name-style="western"><surname>Accardo</surname><given-names>G</given-names> </name><name name-style="western"><surname>Perillo</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Assessment and prediction of response to neoadjuvant chemotherapy in breast cancer: a comparison of imaging modalities and future perspectives</article-title><source>Cancers (Basel)</source><year>2021</year><month>07</month><day>14</day><volume>13</volume><issue>14</issue><fpage>3521</fpage><pub-id pub-id-type="doi">10.3390/cancers13143521</pub-id><pub-id pub-id-type="medline">34298733</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dasgupta</surname><given-names>A</given-names> </name><name name-style="western"><surname>DiCenzo</surname><given-names>D</given-names> </name><name name-style="western"><surname>Sannachi</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Quantitative ultrasound radiomics guided adaptive neoadjuvant chemotherapy in breast cancer: early results from a randomized feasibility study</article-title><source>Front Oncol</source><year>2024</year><volume>14</volume><issue>1273437</issue><fpage>1273437</fpage><pub-id pub-id-type="doi">10.3389/fonc.2024.1273437</pub-id><pub-id pub-id-type="medline">38706611</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>ZJ</given-names> </name><name name-style="western"><surname>Xin</surname><given-names>F</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>ZJ</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Cao</surname><given-names>XC</given-names> </name></person-group><article-title>Real-world data on neoadjuvant chemotherapy with dual-anti HER2 therapy in HER2 positive breast cancer</article-title><source>BMC Cancer</source><year>2024</year><month>01</month><day>25</day><volume>24</volume><issue>1</issue><fpage>134</fpage><pub-id pub-id-type="doi">10.1186/s12885-024-11871-0</pub-id><pub-id pub-id-type="medline">38273267</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haque</surname><given-names>W</given-names> </name><name name-style="western"><surname>Verma</surname><given-names>V</given-names> </name><name name-style="western"><surname>Hatch</surname><given-names>S</given-names> </name><name name-style="western"><surname>Suzanne Klimberg</surname><given-names>V</given-names> </name><name name-style="western"><surname>Brian Butler</surname><given-names>E</given-names> </name><name name-style="western"><surname>Teh</surname><given-names>BS</given-names> </name></person-group><article-title>Response rates and pathologic complete response by breast cancer molecular subtype following neoadjuvant chemotherapy</article-title><source>Breast Cancer Res Treat</source><year>2018</year><month>08</month><volume>170</volume><issue>3</issue><fpage>559</fpage><lpage>567</lpage><pub-id pub-id-type="doi">10.1007/s10549-018-4801-3</pub-id><pub-id pub-id-type="medline">29693228</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hanna</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Olson</surname><given-names>NH</given-names> </name><name name-style="western"><surname>Zarella</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Recommendations for performance evaluation of machine learning in pathology: a concept paper from the College of American Pathologists</article-title><source>Arch Pathol Lab Med</source><year>2024</year><month>10</month><day>1</day><volume>148</volume><issue>10</issue><fpage>e335</fpage><lpage>e361</lpage><pub-id pub-id-type="doi">10.5858/arpa.2023-0042-CP</pub-id><pub-id pub-id-type="medline">38041522</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Basmadjian</surname><given-names>RB</given-names> </name><name name-style="western"><surname>Kong</surname><given-names>S</given-names> </name><name name-style="western"><surname>Boyne</surname><given-names>DJ</given-names> </name><etal/></person-group><article-title>Developing a prediction model for pathologic complete response following neoadjuvant chemotherapy in breast cancer: a comparison of model building approaches</article-title><source>JCO Clin Cancer Inform</source><year>2022</year><month>02</month><volume>6</volume><fpage>e2100055</fpage><pub-id pub-id-type="doi">10.1200/CCI.21.00055</pub-id><pub-id pub-id-type="medline">35148170</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Jeon</surname><given-names>E</given-names> </name><name name-style="western"><surname>Kwon</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Prediction of pathologic complete response to neoadjuvant chemotherapy using machine learning models in patients with breast cancer</article-title><source>Breast Cancer Res Treat</source><year>2021</year><month>10</month><volume>189</volume><issue>3</issue><fpage>747</fpage><lpage>757</lpage><pub-id pub-id-type="doi">10.1007/s10549-021-06310-8</pub-id><pub-id pub-id-type="medline">34224056</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>I</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>K</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Park</surname><given-names>YH</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>SK</given-names> </name></person-group><article-title>A predictive model for pathologic complete response in breast cancer patients treated with neoadjuvant chemotherapy using machine learning</article-title><source>Adv Breast Cancer Res</source><year>2021</year><volume>10</volume><issue>4</issue><fpage>141</fpage><lpage>155</lpage><pub-id pub-id-type="doi">10.4236/abcr.2021.104012</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Conant</surname><given-names>EF</given-names> </name><name name-style="western"><surname>Soo</surname><given-names>MS</given-names> </name></person-group><article-title>Molecular subtypes of breast cancer: a review for breast radiologists</article-title><source>J Breast Imaging</source><year>2021</year><month>01</month><day>26</day><volume>3</volume><issue>1</issue><fpage>12</fpage><lpage>24</lpage><pub-id pub-id-type="doi">10.1093/jbi/wbaa110</pub-id><pub-id pub-id-type="medline">38424845</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jagosky</surname><given-names>M</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>AR</given-names> </name></person-group><article-title>Combination of pertuzumab and trastuzumab in the treatment of HER2-positive early breast cancer: a review of the emerging clinical data</article-title><source>Breast Cancer (Dove Med Press)</source><year>2021</year><volume>13</volume><fpage>393</fpage><lpage>407</lpage><pub-id pub-id-type="doi">10.2147/BCTT.S176514</pub-id><pub-id pub-id-type="medline">34163239</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Agostinetto</surname><given-names>E</given-names> </name><name name-style="western"><surname>Curigliano</surname><given-names>G</given-names> </name><name name-style="western"><surname>Piccart</surname><given-names>M</given-names> </name></person-group><article-title>Emerging treatments in HER2-positive advanced breast cancer: keep raising the bar</article-title><source>Cell Rep Med</source><year>2024</year><month>06</month><day>18</day><volume>5</volume><issue>6</issue><fpage>101575</fpage><pub-id pub-id-type="doi">10.1016/j.xcrm.2024.101575</pub-id><pub-id pub-id-type="medline">38759648</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boughey</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Hoskin</surname><given-names>TL</given-names> </name><name name-style="western"><surname>Goetz</surname><given-names>MP</given-names> </name></person-group><article-title>Neoadjuvant chemotherapy and nodal response rates in luminal breast cancer: effects of age and tumor Ki67</article-title><source>Ann Surg Oncol</source><year>2022</year><month>09</month><volume>29</volume><issue>9</issue><fpage>5747</fpage><lpage>5756</lpage><pub-id pub-id-type="doi">10.1245/s10434-022-11871-z</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kokol</surname><given-names>P</given-names> </name><name name-style="western"><surname>Kokol</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zagoranski</surname><given-names>S</given-names> </name></person-group><article-title>Machine learning on small size samples: a synthetic knowledge synthesis</article-title><source>Sci Prog</source><year>2022</year><volume>105</volume><issue>1</issue><fpage>368504211029777</fpage><pub-id pub-id-type="doi">10.1177/00368504211029777</pub-id><pub-id pub-id-type="medline">35220816</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ji</surname><given-names>X</given-names> </name><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>W</given-names> </name></person-group><article-title>Small data machine learning in materials science</article-title><source>npj Comput Mater</source><year>2023</year><volume>9</volume><issue>1</issue><pub-id pub-id-type="doi">10.1038/s41524-023-01000-z</pub-id></nlm-citation></ref></ref-list></back></article>