<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e64725</article-id><article-id pub-id-type="doi">10.2196/64725</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>A Machine Learning Approach to Differentiate Cold and Hot Syndrome in Viral Pneumonia Integrating Traditional Chinese Medicine and Modern Medicine: Machine Learning Model Development and Validation</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Jin</surname><given-names>Xiaojie</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Wang</surname><given-names>Yanru</given-names></name><degrees>Dr med</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Wang</surname><given-names>Jiarui</given-names></name><degrees>MM</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gao</surname><given-names>Qian</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Huang</surname><given-names>Yuhan</given-names></name><degrees>MM</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Shao</surname><given-names>Lingyu</given-names></name><degrees>MM</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhao</surname><given-names>Jiali</given-names></name><degrees>MM</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>Jintian</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Li</surname><given-names>Ling</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Zhang</surname><given-names>Zhiming</given-names></name><degrees>Prof Dr Med</degrees><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Li</surname><given-names>Shuyan</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Liu</surname><given-names>Yongqi</given-names></name><degrees>Prof Dr, Prof Dr Med</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib></contrib-group><aff id="aff1"><institution>Key Laboratory of Dunhuang Medicine, Ministry of Education, Gansu University of Chinese Medicine</institution><addr-line>Dingxi East Road, 35th</addr-line><addr-line>Lanzhou</addr-line><country>China</country></aff><aff id="aff2"><institution>College of Pharmacy, Gansu University of Chinese Medicine</institution><addr-line>Lanzhou</addr-line><country>China</country></aff><aff id="aff3"><institution>The Second Affiliated Hospital of Xuzhou Medical University</institution><addr-line>Xuzhou</addr-line><country>China</country></aff><aff id="aff4"><institution>School of Medical Information and Engineering, Xuzhou Medical University</institution><addr-line>Xuzhou</addr-line><country>China</country></aff><aff id="aff5"><institution>Gansu Provincial Hospital of Traditional Chinese Medicine</institution><addr-line>Lanzhou</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Hwang</surname><given-names>Feng-Nan</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Hu</surname><given-names>Guang</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Jain</surname><given-names>Prince</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Li</surname><given-names>Yinghong</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Yongqi Liu, Prof Dr, Prof Dr Med, Key Laboratory of Dunhuang Medicine, Ministry of Education, Gansu University of Chinese Medicine, Dingxi East Road, 35th, Lanzhou, 730000, China, 86 13919019578; <email>liuyongqi73@163.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>16</day><month>7</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e64725</elocation-id><history><date date-type="received"><day>25</day><month>07</month><year>2024</year></date><date date-type="rev-recd"><day>03</day><month>05</month><year>2025</year></date><date date-type="accepted"><day>09</day><month>05</month><year>2025</year></date></history><copyright-statement>&#x00A9; Xiaojie Jin, Yanru Wang, Jiarui Wang, Qian Gao, Yuhan Huang, Lingyu Shao, Jiali Zhao, Jintian Li, Ling Li, Zhiming Zhang, Shuyan Li, Yongqi Liu. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 16.7.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e64725"/><abstract><sec><title>Background</title><p>Syndrome differentiation in traditional Chinese medicine (TCM) is an ancient principle that guides disease diagnosis and treatment. Among these, the cold and hot syndromes play a crucial role in identifying the nature of the disease and guiding the treatment of viral pneumonia. However, differentiating between cold and hot syndromes is often considered esoteric. Machine learning offers a promising avenue for clinicians to identify these syndromes more accurately, thereby supporting more informed clinical decision-making in the treatment.</p></sec><sec><title>Objective</title><p>This study aims to construct a diagnostic model for differentiating cold and hot syndromes in viral pneumonia by integrating TCM and modern medical features using machine learning methods.</p></sec><sec sec-type="methods"><title>Methods</title><p>The application of 8 machine learning algorithms (gradient boosting machine [GBM], logistic regression, random forest, extreme gradient boosting [XGB], light gradient boosting machine [LGB], ridge regression, least absolute shrinkage and selection operator, and support vector machine) generated and validated (both internally and externally) a model for differentiating cold and hot syndromes in viral pneumonia, based on clinical data from 1484 patient samples collected at 2 medical centers between 2021 and 2022.</p></sec><sec sec-type="results"><title>Results</title><p>The GBM model, which combines TCM and modern medicine features, outperformed models using only TCM features or only modern medicine features in distinguishing cold and hot syndromes in patients with viral pneumonia. The optimal discrimination model comprised 13 optimal features (temperature, red cell distribution width-SD, creatinine, total bilirubin, globulin, C-reactive protein, unconjugated bilirubin, white blood cell, neutrophil percentage, aspartate transaminase/alanine transaminase, total cholesterol, thrombocytocrit, and age) and the GBM algorithm, achieving an area under the curve (AUC) of 0.7788. Under internal and external testing, the AUCs were 0.7645 and 0.8428, respectively. Moreover, significant differences were observed between the cold and hot syndrome groups in temperature (<italic>P</italic>=.02), red cell distribution width-SD (<italic>P</italic>&#x003C;.001), neutrophil percentage (<italic>P</italic>=.01), total cholesterol (<italic>P</italic>=.003), thrombocytocrit (<italic>P</italic>&#x003C;.001), and age (<italic>P</italic>&#x003C;.001).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This pioneering study integrates the theory of TCM cold and hot syndromes with modern laboratory-based tests through machine learning. The developed model offers a novel approach for differentiating cold and hot syndromes in viral pneumonia, enabling practitioners to identify the syndrome quickly and efficiently, thereby supporting more informed clinical decision-making. Additionally, this research provides new insights into the modernization and scientific interpretation of TCM syndrome differentiation.</p></sec></abstract><kwd-group><kwd>syndrome differentiation</kwd><kwd>traditional Chinese medicine</kwd><kwd>viral pneumonia</kwd><kwd>dialectical treatment</kwd><kwd>machine learning</kwd><kwd>Chinese medicine</kwd><kwd>pneumonia</kwd><kwd>lungs</kwd><kwd>diagnostic model</kwd><kwd>retrospective study</kwd><kwd>artificial intelligence</kwd><kwd>China</kwd><kwd>model training</kwd><kwd>performance evaluation</kwd><kwd>laboratory tests</kwd><kwd>modern medicine</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Traditional Chinese medicine (TCM), a personalized and holistic approach, treats diseases using natural medical products tailored to a patient&#x2019;s TCM syndrome patterns [<xref ref-type="bibr" rid="ref1">1</xref>], that is, dialectical treatment of TCM. Specifically, TCM syndrome, a concept unique to TCM, is an abstraction of a variety of signs and symptoms. Dialectical treatment is the fundamental principle by which physicians diagnose, understand, and treat diseases. It involves comprehensively collecting patients&#x2019; clinical signs and symptoms through &#x201C;inspection, auscultation, olfaction, inquiry, and palpation&#x201D; to determine the TCM syndrome pattern. Subsequently, corresponding therapies, such as acupuncture, cupping, qigong, massage, and diet, are selected [<xref ref-type="bibr" rid="ref2">2</xref>] to correct maladjustments and restore the body&#x2019;s self-regulatory ability [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Guided by this unique principle, TCM has demonstrated remarkable clinical efficacy in treating various acute and chronic diseases, thus attracting increasing attention [<xref ref-type="bibr" rid="ref5">5</xref>]. Especially in the fight against viral pneumonia, the importance of TCM has been widely recognized [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Consequently, promptly and accurately understanding the TCM syndrome pattern of a disease can reshape global health and welfare.</p><p>In recent years, with the successive outbreaks of SARS, influenza A (H1N1), influenza A (H7N9), COVID-19, and other viruses, viral pneumonia has become a sustained and widespread disease burden in many countries and globally. As with other diseases, the accurate identification of syndrome patterns is a prerequisite for the TCM-based prevention and treatment of viral pneumonia. Numerous studies have reported that the cold and hot syndromes are the pivotal TCM syndrome patterns in cases of viral pneumonia, such as SARS and COVID-19 [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Cold and hot syndromes, originating from the <italic>Huangdi Neijing,</italic> are 2 key components of the Eight Principle Syndromes&#x2014;the general principles of dialectical treatment, which include cold and hot, sthenia and asthenia, exterior and interior, and yin and yang&#x2014;and are used to identify the nature of a disease, reflecting disruptions in body homeostasis [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Cold syndrome&#x2013;related expressions include coldness, cold pain, tastelessness, and clear, abundant urine, whereas hot syndrome is mainly characterized by heat, diaphoresis, a flushed face, burning pain, and deep-colored urine. The cold and hot syndrome framework has been widely applied in the diagnosis and treatment of viral pneumonia. Treating cold and hot syndromes within TCM has been shown to significantly alleviate clinical symptoms in patients with viral pneumonia [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. For example, symptomatic treatments with Chinese medicines such as Lianhua Qingwen capsules and Xuanfeibaidu granules can markedly reduce the incidence of severe or critical events and improve clinical recovery [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>], indicating that the prediction and differentiation of cold and hot syndromes play a vital role in the treatment of viral pneumonia.</p><p>Nevertheless, although clinical data and studies have indicated that TCM treatments for the cold and hot syndromes of viral pneumonia are effective, a major challenge remains in distinguishing between these syndromes&#x2014;similar to the challenges in identifying other TCM syndrome patterns. Specifically, (1) the differentiation of cold and hot syndrome is recondite and lacks a solid scientific foundation in classical TCM theory, and (2) the accuracy of cold and hot syndrome diagnosis in TCM relies heavily on the physicians&#x2019; skills and years of clinical experience. Subjective factors play a decisive role in TCM diagnosis, which inevitably leads to a lack of standardized criteria and an objective diagnostic basis for cold and hot syndromes. This unique diagnostic model not only supports the open and divergent development of TCM, but also hinders the understanding of cold and hot syndromes in viral pneumonia from a modern biomedical perspective. It further restricts the domestic and international dissemination of TCM syndrome differentiation, making it one of the key bottlenecks in the development of TCM. Therefore, in the process of integrating TCM with modern medicine, it is worth considering how to combine TCM syndrome theory with modern medicine to enhance the scientific rigor and objectivity of cold and hot syndrome differentiation in the treatment of viral pneumonia.</p><p>Recently, with the rapid development of machine learning [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref18">18</xref>], artificial intelligence has brought unprecedented challenges and opportunities to the diagnosis of TCM syndrome. Interdisciplinary models combining TCM and artificial intelligence have been proposed to model TCM knowledge, diagnosis, and treatment in clinical practice. Among these, numerous models have been developed to simulate the syndrome differentiation process of human TCM doctors for automatic syndrome diagnosis. For example, Huang et al [<xref ref-type="bibr" rid="ref19">19</xref>] successfully identified the liver-gallbladder dampness-heat syndrome in patients with breast cancer using a dataset based on the prescriptions of TCM clinical practitioners. Zhuo et al [<xref ref-type="bibr" rid="ref20">20</xref>] effectively differentiated Qi deficiency blood stasis syndrome and phlegm stasis in channels syndrome in patients with stroke through artificial intelligence&#x2013;assisted retinal feature analysis. These examples demonstrate that machine learning enables a modern interpretation of the scientific connotation of TCM syndrome differentiation, supporting improved clinical decision-making in disease treatment. However, currently, there is still a lack of machine learning&#x2013;based differentiation of cold and hot syndromes in viral pneumonia.</p><p>Among the machine learning algorithms in artificial intelligence, gradient boosting machine (GBM), logistic regression (LR), random forest (RF), extreme gradient boosting (XGB), and light gradient boosting machine (LGB), among others, have demonstrated promising performance [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. Consequently, this study aimed to compare 8 machine learning methods, namely, GBM, LR, RF, XGB, LGB, ridge regression (RIDGE), least absolute shrinkage and selection operator (LASSO), and support vector machine (SVM), by integrating laboratory test indicators from modern medicine with the TCM cold and hot syndrome, to explore the connection between them and construct a diagnostic model for differentiating the cold and hot syndromes in viral pneumonia. This approach seeks to provide a new diagnostic method for the clinical differentiation of cold and hot syndromes in viral pneumonia and to offer new perspectives for the scientization, standardization, and objectivity of TCM syndrome differentiation theory in guiding treatment.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Source of Materials</title><p>In this study, a retrospective review of case sheets was conducted on samples from 1401 patients diagnosed with viral pneumonia between January 18 and November 6, 2021, at the Second People&#x2019;s Hospital of Lanzhou City in China. Samples were excluded based on the following criteria: (1) the diagnosis was not made using the Eight Principle Syndromes of TCM, and (2) the patient was diagnosed with both cold and hot syndrome patterns simultaneously. A total of 602 samples met the inclusion criteria. Samples with more than 20% (ie, 19/93 features) missing values were further excluded, resulting in 382 samples ultimately included for analysis. These comprised 97 negative samples (cold syndrome) and 285 positive samples (hot syndrome). Additionally, a stratified sampling strategy was applied to split the original dataset into training and internal test cohorts at an 8:2 ratio (details are provided in the &#x201C;Performance Evaluation and Model Validation&#x201D; section).</p><p>The external test cohort consisted of 83 patients with viral pneumonia diagnosed with either cold or hot syndrome at Lanzhou Heavy Ion Hospital between July and August 2022. This cohort included 36 patients with the hot syndrome and 47 patients with the cold syndrome.</p></sec><sec id="s2-2"><title>TCM and Modern Medicine Features Collection and Cold and Hot Syndrome Diagnosis</title><p>As shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, a total of 93 features related to TCM and modern medicine were collected in this study, including 4 general information items, 19 TCM symptoms, 2 blood gas values, 10 viral pneumonia indicators, 27 biochemical indicators, 30 blood routine indicators, and 1 coagulation indicator. Among these, patients&#x2019; TCM symptoms were further quantified using a TCM symptom scoring scale for viral pneumonia (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p><p>All patients with viral pneumonia were independently diagnosed with either the TCM cold or hot syndrome by 2 TCM chief physicians. If both physicians provided the same diagnosis, the patient was enrolled. In cases of disagreement, a third investigator participated in the discussion to reach a consensus. The diagnostic criteria for syndrome differentiation were based on the textbooks <italic>TCM Diagnostics</italic> [<xref ref-type="bibr" rid="ref25">25</xref>] and <italic>Guiding Principles of Clinical Research on New Drugs of Traditional Chinese Medicine</italic> [<xref ref-type="bibr" rid="ref26">26</xref>]. These criteria include the 4 classical diagnostic methods used to determine TCM cold and hot syndrome patterns: inspection, auscultation, inquiry, and palpation, to accurately record the TCM characteristics.</p></sec><sec id="s2-3"><title>Model Training</title><p>In this study, 8 machine learning algorithms (GBM, LR, RF, XGB, LGB, RIDGE, LASSO, and SVM) were used to train a dataset containing all features, and GBM was selected as the final classification model. As shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>, GBM operates on the principle of ensemble learning, constructing the final prediction model by iteratively training a series of weak learners, typically decision trees. The core mechanism of GBM lies in its ability to correct the prediction errors of previous decision trees. Each newly generated decision tree is trained to fit the residuals&#x2014;the differences between the actual values and the predicted values&#x2014;of the previous model, thereby continuously reducing the overall loss function. Specifically, GBM begins by constructing an initial decision tree based on the training data, and then calculates the prediction error of this tree. A second tree is built to model the residuals, with its predictions aimed at correcting the deficiencies of the first tree. This process continues iteratively until a preset number of iterations is reached or a stopping condition is met. <xref ref-type="fig" rid="figure1">Figure 1</xref> illustrates the structure and decision-making process of multiple decision trees in the GBM model. Each decision tree branches based on input features, and the final prediction is obtained through a weighted sum of the predictions from all individual trees.</p><p>The number of top-ranking indexes was gradually increased, and the hyperparameters n_estimators and max_depth were tuned. The final model consisted of 13 top-ranking features, with n_estimators and max_depth set to 797 and 8, respectively. The GBM was implemented using the scikit-learn library (version 0.24.1) in Python (version 3.8.8; Python Foundation).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Gradient boosting machine decision tree composition and prediction flowchart.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64725_fig01.png"/></fig></sec><sec id="s2-4"><title>Optimal Feature Ascertainment</title><p>&#x201C;Feature importance,&#x201D; &#x201C;coef,&#x201D; and &#x201C;SHAP values&#x201D; are 3 commonly used methods to assess the relationship between features and machine learning models, and they have received significant attention in recent research [<xref ref-type="bibr" rid="ref27">27</xref>]. These methods calculate the relevance of each feature to the model&#x2019;s predictions, which are then ranked in descending order to produce a feature importance ranking.</p><p>In tree-based models (eg, GBM, RF, XGB, LGB), feature importance is typically evaluated from 2 perspectives: split count and split gain. Split count refers to how often a particular feature is selected as a splitting point during tree construction; a higher count indicates greater importance. By contrast, split gain measures the improvement in the model&#x2019;s objective function (eg, squared error loss) resulting from splitting on a given feature. A larger gain implies a greater contribution to model performance and hence higher importance. Additionally, SHAP (Shapley Additive Explanations) values offer a unified measure of feature importance based on game theory by calculating the marginal contribution of each feature to the model&#x2019;s prediction. SHAP values provide both global and local interpretability of the model. In linear models (eg, RIDGE, LASSO, SVM, and LR), &#x201C;coef&#x201D; represents the coefficients assigned to each feature. These coefficients indicate the strength and direction of the linear relationship between each feature and the target variable. SHAP values can complement these coefficients by revealing nonlinear effects and feature interactions that may not be captured by standard linear models.</p><p>The insights gained from these methods, especially when combining traditional feature importance metrics with SHAP analysis, can aid researchers in uncovering hidden data patterns and insights, thereby supporting scientific investigations and informing practical applications. Accordingly, these methods are used to rank the feature importance for cold and hot syndromes of viral pneumonia and to ascertain the optimal features.</p></sec><sec id="s2-5"><title>Performance Evaluation and Model Validation</title><p>During the data preprocessing stage, a stratified sampling strategy was adopted to divide the original dataset, ensuring an 8:2 ratio between the training and validation sets. This approach preserved the proportional distribution of each class (cold and hot syndromes) as in the original dataset, thereby avoiding model evaluation bias due to imbalanced category distributions.</p><p>Given the relatively small sample size, 5-fold cross-validation was applied to ensure model accuracy and reliability. As illustrated in <xref ref-type="fig" rid="figure2">Figure 2</xref>, the dataset was divided into 5 nonoverlapping subsets of equal size. In each round of validation, 1 subset was selected as the validation set (the blue portion in the figure), while the remaining 4 subsets constituted the training set (gray portions). This process was repeated for 5 rounds. In the first round, the first subset was the validation set, and the remaining 4 were used as the training set, resulting in Performance<sub>&#x2081;</sub>. In the second round, the second subset was used for validation, and so on, resulting in Performance<sub>&#x2082;</sub> through Performance<sub>5</sub>. The final model performance was calculated as the average of these 5 evaluation results, with the formula <inline-formula><mml:math id="ieqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">e</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">r</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">f</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">o</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">r</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">m</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">a</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">n</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">c</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">e</mml:mi></mml:mrow><mml:mrow><mml:mtext>&#x00A0;</mml:mtext></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mtext>&#x00A0;</mml:mtext></mml:mrow><mml:munderover><mml:mo movablelimits="false">&#x2211;</mml:mo><mml:mrow><mml:mrow><mml:mi mathvariant="normal">i</mml:mi></mml:mrow><mml:mrow><mml:mtext>&#x00A0;</mml:mtext></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mtext>&#x00A0;</mml:mtext></mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mn>5</mml:mn></mml:mrow></mml:munderover><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">e</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">r</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">f</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">o</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">r</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">m</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">a</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">n</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">c</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">e</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">i</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:mrow></mml:mstyle></mml:math></inline-formula>. This strategy ensured that each sample was used for both training and validation, reduced the variance caused by random sample division, and improved the robustness and reliability of the model evaluation [<xref ref-type="bibr" rid="ref28">28</xref>].</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>The 5-fold cross-validation process diagram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64725_fig02.png"/></fig><p>In addition, a comprehensive evaluation of the model was conducted using commonly used metrics, including sensitivity, specificity (SPE), accuracy (ACC), Matthews correlation coefficient (MCC), and area under the curve (AUC). These metrics are calculated based on the values of true positives (TPs), true negatives (TNs), false positives (FPs), and false negatives (FNs), as defined below:</p><disp-formula id="E1"><label>(1)</label><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mtext>Sens</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:math></disp-formula><disp-formula id="E2"><label>(2)</label><mml:math id="eqn2"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mtext>Spec</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>N</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:math></disp-formula><disp-formula id="E3"><label>(3)</label><mml:math id="eqn3"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mtext>ACC</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:math></disp-formula><disp-formula id="E4"> <label>(4)</label><mml:math id="eqn4"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mtext>MCC</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x22C5;</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x22C5;</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:msqrt><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:msqrt></mml:mfrac></mml:mrow></mml:mstyle></mml:math></disp-formula><p>The receiver operating characteristic curve, also known as the sensitivity curve, is a graphical representation of the performance of a classification model across various evaluation thresholds. It plots the true-positive rate against the false-positive rate at different threshold settings. The true-positive rate reflects the proportion of actual positive cases correctly identified by the model, while the false-positive rate represents the proportion of negative cases incorrectly classified as positive. The AUC provides a single summary metric of the classifier&#x2019;s overall performance, with values ranging from 0 to 1. A higher AUC value indicates better classification performance. Therefore, AUC is widely used as a standard metric to evaluate the performance of classification models. The formula for calculating AUC is as follows:</p><disp-formula id="E5"><label>(5)</label><mml:math id="eqn5"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mtext>AUC</mml:mtext><mml:mo>=</mml:mo><mml:msubsup><mml:mo>&#x222B;</mml:mo><mml:mrow><mml:mn>0</mml:mn></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mi>R</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mtext>FDR</mml:mtext><mml:mo stretchy="false">)</mml:mo><mml:mtext>&#x00A0;</mml:mtext><mml:mi>d</mml:mi><mml:mtext>FDR</mml:mtext></mml:mrow></mml:mstyle></mml:math></disp-formula></sec><sec id="s2-6"><title>Ethical Considerations</title><p>The study was approved by the Medical Ethics Review Committee of the Second People&#x2019;s Hospital of Lanzhou City and Lanzhou Heavy Ion Hospital (approval number 2021-026-01). Informed consent was obtained on an opt-out basis, and all data were anonymized. No financial or material incentives were provided to participants.</p></sec><sec id="s2-7"><title>Statistical Analysis</title><p>All data were analyzed using SPSS version 27.0 (IBM Corp). Categorical variables are presented as counts and percentages, whereas continuous variables are reported as means and SDs or IQRs, as appropriate. Normality was assessed using the Kolmogorov-Smirnov test. Student 2-tailed <italic>t</italic> test was used to compare parametric continuous variables, while the Mann-Whitney <italic>U</italic> test was used for nonparametric variables, the  <italic>&#x03C7;</italic><sup>2</sup> test was applied for categorical variables, and the Fisher exact test was used for 2&#x00D7;2 contingency tables. Binomial distribution tests were performed for each feature within the cold syndrome and hot syndrome groups. No correction for multiple comparisons was applied. A 2-sided <italic>P</italic>&#x003C;.05 was considered statistically significant.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Data Extraction</title><p>We included only individual samples from patients with viral pneumonia and excluded those that were not diagnosed using the Eight Principle Syndromes (cold and hot, sthenia and asthenia, exterior and interior, and yin and yang), as well as those simultaneously diagnosed with cold and hot syndrome. A total of 602 eligible samples were retained. Samples with more than 20% (ie, 19/93 features) missing values were further excluded, and the remaining missing values were imputed using the median of each variable. Ultimately, 382 complete samples were included in the final analysis and used to construct the mathematical model. The dataset was split into training and testing sets in an 8:2 ratio. Subsequently, by integrating indicators from TCM and modern medicine and applying 8 machine learning algorithms, we identified the optimal model for differentiating TCM cold-hot syndromes in viral pneumonia through 5-fold cross-validation. The model&#x2019;s performance was further assessed using an external validation cohort. The data processing workflow and model construction process are illustrated in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Research flow for data processing and predictive model construction. After preliminary screening of the collected data, 382 samples of patients with viral pneumonia with TCM cold and hot syndromes were obtained. The dataset was randomly divided into training and test sets in an 8:2 ratio. Traditional Chinese medicine and modern medical indicators were extracted through data processing and statistical analysis. The performance of the 8 machine learning models (gradient boosting machine [GBM], logistic regression [LR], random forest [RF], extreme gradient boosting [XGB], light gradient boosting machine [LGB], ridge regression, least absolute shrinkage and selection operator [LASSO], and support vector machine [SVM]) was evaluated. Based on a comprehensive evaluation of all models, the optimal classification algorithm and feature set were identified. The final model&#x2019;s performance was further assessed using internal and external test cohorts.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64725_fig03.png"/></fig></sec><sec id="s3-2"><title>Model Training Based on TCM and Modern Medicine Features</title><p>Modern medical indicators based on laboratory testing provide the possibility for intelligent discrimination of TCM syndromes. Therefore, in this study, modern medical indicators were integrated with TCM features for further exploration. A total of 93 features were used to construct the model. The evaluation metrics for models using all 93 features are presented in <xref ref-type="table" rid="table1">Table 1</xref> and <xref ref-type="fig" rid="figure4">Figure 4A</xref>. We found that GBM and LGB achieved the highest AUC scores of 0.8329 and 0.7693, respectively, indicating their superior overall discriminative performance. GBM also obtained the highest ACC score of 0.8000, closely followed by RIDGE with a score of 0.7475, suggesting strong overall classification accuracy. LASSO, RIDGE, and GBM achieved the highest sensitivity scores of 0.8430, 0.8388, and 0.8283, respectively, indicating good performance in correctly identifying positive samples and reducing false negatives. SVM, LGB, RF, and GBM achieved the highest specificity scores, suggesting these models had the lowest false-positive rates. Both GBM and LGB also achieved relatively high MCC scores of 0.5043 and 0.4068, respectively, demonstrating their effectiveness in handling imbalanced datasets.</p><p>Internal validation showed that GBM, RF, and XGB achieved the highest AUC scores of 0.7085, 0.7477, and 0.7146, respectively. Additionally, we calculated the confusion matrix for each model in the internal validation cohort, as shown in <xref ref-type="fig" rid="figure4">Figure 4B</xref>. The sum of correctly predicted cold and hot samples reflects the overall predictive accuracy of each model. GBM, LR, RF, XGB, LGB, RIDGE, LASSO, and SVM correctly predicted 53, 52, 53, 57, 56, 49, 53, and 52 cold and hot samples, respectively. These findings further demonstrate the effectiveness of these models in distinguishing cold and heat patterns in viral pneumonia.</p><p>Overall, the results suggest that models incorporating both TCM and modern medicine features exhibit strong predictive performance for differentiating between cold and hot syndromes in viral pneumonia. Among them, the GBM algorithm demonstrated a particularly prominent discriminative capability. Therefore, GBM was selected as the optimal classified model based on the full set of 93 features for subsequent analysis.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Comparison of models based on 5-fold cross-validation results using 93 features from traditional Chinese medicine and modern medicine.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Data cohort and evaluation</td><td align="left" valign="bottom">Gradient boosting machine</td><td align="left" valign="bottom">Logistic regression</td><td align="left" valign="bottom">Random forest</td><td align="left" valign="bottom">Extreme gradient boosting</td><td align="left" valign="bottom">Light gradient boosting machine</td><td align="left" valign="bottom">Ridge regression</td><td align="left" valign="bottom">Least absolute shrinkage and selection operator</td><td align="left" valign="bottom">Support vector machine</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="9">Training</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Area under the curve</td><td align="left" valign="top">0.8329</td><td align="left" valign="top">0.6477</td><td align="left" valign="top">0.7272</td><td align="left" valign="top">0.7546</td><td align="left" valign="top">0.7693</td><td align="left" valign="top">0.6970</td><td align="left" valign="top">0.6974</td><td align="left" valign="top">0.6514</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Accuracy</td><td align="left" valign="top">0.8000</td><td align="left" valign="top">0.6787</td><td align="left" valign="top">0.6689</td><td align="left" valign="top">0.6984</td><td align="left" valign="top">0.7246</td><td align="left" valign="top">0.7475</td><td align="left" valign="top">0.7475</td><td align="left" valign="top">0.4459</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="left" valign="top">0.8283</td><td align="left" valign="top">0.7365</td><td align="left" valign="top">0.6582</td><td align="left" valign="top">0.7172</td><td align="left" valign="top">0.7158</td><td align="left" valign="top">0.8388</td><td align="left" valign="top">0.8430</td><td align="left" valign="top">0.2975</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="left" valign="top">0.7016</td><td align="left" valign="top">0.5187</td><td align="left" valign="top">0.7066</td><td align="left" valign="top">0.6326</td><td align="left" valign="top">0.7327</td><td align="left" valign="top">0.4764</td><td align="left" valign="top">0.4656</td><td align="left" valign="top">0.9018</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Matthews correlation coefficient</td><td align="left" valign="top">0.5043</td><td align="left" valign="top">0.2341</td><td align="left" valign="top">0.3190</td><td align="left" valign="top">0.3177</td><td align="left" valign="top">0.4068</td><td align="left" valign="top">0.3364</td><td align="left" valign="top">0.3407</td><td align="left" valign="top">0.2161</td></tr><tr><td align="left" valign="top" colspan="9">Internal validation</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Area under the curve</td><td align="left" valign="top">0.7085</td><td align="left" valign="top">0.6854</td><td align="left" valign="top">0.7477</td><td align="left" valign="top">0.7146</td><td align="left" valign="top">0.6800</td><td align="left" valign="top">0.6392</td><td align="left" valign="top">0.6908</td><td align="left" valign="top">0.6031</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Accuracy</td><td align="left" valign="top">0.6883</td><td align="left" valign="top">0.6753</td><td align="left" valign="top">0.6883</td><td align="left" valign="top">0.7403</td><td align="left" valign="top">0.7273</td><td align="left" valign="top">0.6364</td><td align="left" valign="top">0.6883</td><td align="left" valign="top">0.6753</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="left" valign="top">0.9615</td><td align="left" valign="top">0.8846</td><td align="left" valign="top">0.9808</td><td align="left" valign="top">0.9808</td><td align="left" valign="top">0.9615</td><td align="left" valign="top">0.8462</td><td align="left" valign="top">0.9231</td><td align="left" valign="top">1.0000</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="left" valign="top">0.1200</td><td align="left" valign="top">0.2400</td><td align="left" valign="top">0.0800</td><td align="left" valign="top">0.2400</td><td align="left" valign="top">0.2400</td><td align="left" valign="top">0.2000</td><td align="left" valign="top">0.2000</td><td align="left" valign="top">0.0000</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Matthews correlation coefficient</td><td align="left" valign="top">0.1549</td><td align="left" valign="top">0.1609</td><td align="left" valign="top">0.1471</td><td align="left" valign="top">0.3596</td><td align="left" valign="top">0.3093</td><td align="left" valign="top">0.0577</td><td align="left" valign="top">0.1794</td><td align="left" valign="top">0.0000</td></tr></tbody></table></table-wrap><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Performance evaluation of the cold and hot syndrome identification models based on integrated traditional Chinese medicine (TCM) and modern medical features. (A) Radar chart comparing the performance of 8 machine learning models in the training and internal validation cohorts. (B) Confusion matrix analysis of the 8 models in the internal validation cohort. ACC: accuracy; AUC: area under the curve; GBM: gradient boosting machine; LASSO: least absolute shrinkage and selection operator; LGB: light gradient boosting machine; LR: logistic regression; MCC: Matthews correlation coefficient; RF: random forest; RIDGE: ridge regression; SEN: sensitivity; SPE: specificity; SVM: support vector machine; XGB: extreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64725_fig04.png"/></fig></sec><sec id="s3-3"><title>Optimal Feature Ascertainment</title><p>Based on the optimum classified model (GBM) and the ranking of &#x201C;feature importance,&#x201D; we identified 23 key features with importance values more than twice the median. These were temperature (T), red cell distribution width-SD (RDW-SD), creatinine (CREA), total bilirubin (TBIL), globulin (GLO), C-reactive protein (CRP), unconjugated bilirubin (IBIL), white blood cell (WBC), neutrophil percentage (NEU%), aspartate transaminase/alanine transaminase (AST/ALT), total cholesterol (TCHO), thrombocytocrit (PCT), oxygen saturation under load (SaO<sub>2</sub>), age, platelets, mean platelet volume, lactate dehydrogenase, mean corpuscular hemoglobin concentration, urea, erythrocyte/red blood cell, Na, ORF1ab gene of novel coronavirus by nose test (nCovORF1ab), and albumin.</p><p>Subsequently, to identify the best-performing model with the fewest features, we examined how the number of top-ranked features influenced model performance (AUC, ACC, and MCC) using the GBM algorithm. As shown in <xref ref-type="fig" rid="figure5">Figure 5A and B</xref>, as the number of features increases, model performance gradually improves. Notably, at the 14-feature mark, the model achieved strong performance with an AUC of 0.7604, an ACC of 0.7082, and an MCC of 0.3515. To validate the robustness of our feature selection approach, we also used the SHAP feature importance ranking to select the top 14 features and construct a model. This model achieved an AUC of 0.7406, which was slightly lower than that obtained using the feature importance method (0.7604). Therefore, the feature importance method was ultimately retained as the feature selection approach for this study.</p><p>Finally, considering both the practicality of indicator testing and the feasibility of the clinical application, this study selected the top 14 features, excluding SaO<sub>2</sub> (under load), as the optimal set for differentiating between cold and hot syndromes in viral pneumonia. These features are temperature (T), RDW-SD, CREA, TBIL, GLO, CRP, IBIL, WBC, NEU%, AST/ALT, TCHO, PCT, and age (AGE), as illustrated in (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Identification of key features based on feature importance analysis and model cross-validation. (A) Effect of the number of selected key features (n=23) on model performance using the gradient boosting machine (GBM) algorithm. (B) Feature importance scores of the top 14 key features identified by the GBM model. ACC: accuracy; AUC: area under the curve; AST/ALT: aspartate transaminase/alanine transaminase; CREA: creatinine; CRP: C-reactive protein; GLO: globulin; IBIL: unconjugated bilirubin; MCC: Matthews correlation coefficient; NEU%: neutrophil percentage; PCT: thrombocytocrit; RDW-SD: red cell distribution width-SD; SaO<sub>2</sub>: oxygen saturation under load; T: temperature; TBIL: total bilirubin; TCHO: total cholesterol; WBC: white blood cell.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64725_fig05.png"/></fig></sec><sec id="s3-4"><title>Performance Evaluation and Optimal Model Establishment</title><p>To achieve optimal GBM model performance, we reconstructed the GBM model based on 13 optimizing features. Ultimately, the model was adjusted to threshold=0.99999, n_estimators=797, max_depth=8, min_samples_split=2, and min_samples_leaf=1. Simultaneously, the performance of the model with 13 features was further evaluated using 5-fold cross-validation, and the results suggested that the model performance was outstanding, as the average AUC value reached 0.7788 (<xref ref-type="fig" rid="figure6">Figure 6A</xref>). Model verification results showed that the AUC was 0.7645 by the internal test cohort (<xref ref-type="fig" rid="figure6">Figure 6B</xref>). Furthermore, the additional external test results showed that the model performance for AUC, ACC, sensitivity, specificity, and MCC is 0.8428, 0.6627, 0.7222, 0.6170, and 0.3369, respectively. These results validated the excellent performance of the model.</p><p>Moreover, we found that the temperature in the hot syndrome group was significantly higher than in the cold syndrome group (<italic>P</italic>=.02). By contrast, RDW-SD (<italic>P</italic>&#x003C;.001), NEU% (<italic>P</italic>=.01), TCHO (<italic>P</italic>=.003), PCT (<italic>P</italic>&#x003C;.001), and AGE (<italic>P</italic>&#x003C;.001) were significantly lower in the hot syndrome group compared with the cold syndrome group, as shown in <xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="fig" rid="figure7">Figure 7</xref>. These results align with previous studies, which have reported that temperature, AGE, CREA, and RDW-SD are closely associated with the severity of viral pneumonia [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref33">33</xref>], supporting the validity of our findings.</p><p>These results suggest that machine learning algorithms perform well in differentiating between TCM cold and hot syndromes in viral pneumonia. The optimal model was constructed using 13 key features (T, RDW-SD, CREA, TBIL, GLO, CRP, IBIL, WBC, NEU%, AST/ALT, TCHO, PCT, and AGE), combined with the GBM algorithm. Among these, temperature (T), RDW-SD, NEU%, TCHO, PCT, and AGE appear to be the most relevant features for predicting cold and hot syndrome.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>ROC curves and corresponding AUCs for cross-validation on the training and test sets. (A) ROC curve and classification performance of the final model set on the training set using 5-fold cross-validation. The x-axis represents the false-positive rate (FPR), and the y-axis represents the true-positive rate (TPR). (B) ROC curve and classification performance of the final model on the test set. The x-axis represents the FPR, and the y-axis represents the TPR. AUC: area under the curve; GBM: gradient boosting machine; ROC: receiver operating characteristic.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64725_fig06.png"/></fig><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>The 13 optimal features for distinguishing between cold and hot syndromes in analysis.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Clinical features</td><td align="left" valign="bottom">Cold (n=97), median (IQR)</td><td align="left" valign="bottom">Hot (n=285), median (IQR)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Temperature (&#x00B0;C)</td><td align="left" valign="top">36.600 (36.500-36.950)</td><td align="left" valign="top">36.800 (36.500-36.95)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top">Red cell distribution width (%)</td><td align="left" valign="top">44.500 (42.800-46.850)</td><td align="left" valign="top">43.400 (41.80-45.100)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Creatinine (&#x03BC;mol/L)</td><td align="left" valign="top">63.000 (54.000-78.000)</td><td align="left" valign="top">61.000 (51.000-73.500)</td><td align="left" valign="top">.13</td></tr><tr><td align="left" valign="top">Total bilirubin (&#x03BC;mol/L)</td><td align="left" valign="top">9.400 (7.350-12.450)</td><td align="left" valign="top">9.000 (7.200-11.550)</td><td align="left" valign="top">.31</td></tr><tr><td align="left" valign="top">Globulin (g/L)</td><td align="left" valign="top">27.500 (24.150-30.750)</td><td align="left" valign="top">26.600 (23.600-29.600)</td><td align="left" valign="top">.18</td></tr><tr><td align="left" valign="top">C-reactive protein (mg/L)</td><td align="left" valign="top">2.670 (1.355-6.530)</td><td align="left" valign="top">2.670 (0.865-7.235)</td><td align="left" valign="top">.41</td></tr><tr><td align="left" valign="top">Unconjugated bilirubin (&#x03BC;mol/L)</td><td align="left" valign="top">5.400 (4.000-6.900)</td><td align="left" valign="top">5.200 (3.900-6.800)</td><td align="left" valign="top">.28</td></tr><tr><td align="left" valign="top">White blood cell (&#x00D7;10<sup>9</sup>/L)</td><td align="left" valign="top">5.300 (4.450-6.400)</td><td align="left" valign="top">5.100 (4.100-6.250)</td><td align="left" valign="top">.22</td></tr><tr><td align="left" valign="top">Neutrophil percentage (%)</td><td align="left" valign="top">62.000 (56.000-68.500)</td><td align="left" valign="top">58.000 (50.500-67.000)</td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top">Aspartate transaminase/alanine transaminase (%)</td><td align="left" valign="top">1.200 (0.800-1.445)</td><td align="left" valign="top">1.100 (0.800-1.500)</td><td align="left" valign="top">.68</td></tr><tr><td align="left" valign="top">Total cholesterol (mmol/L)</td><td align="left" valign="top">3.900 (3.630-4.400)</td><td align="left" valign="top">3.700 (3.190-4.365)</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top">Thrombocytocrit (%)</td><td align="left" valign="top">0.240 (0.210-0.290)</td><td align="left" valign="top">0.240 (0.200-0.290)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Age (years)</td><td align="left" valign="top">47.000 (34.000&#x2010;67.000)</td><td align="left" valign="top">37.000 (24.000&#x2010;57.000)</td><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table></table-wrap><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Violin plots showing the relationships between cold and hot syndromes and the expression levels of optimal clinical features. The horizontal axis represents the different syndromes (cold and hot), while the vertical axis indicates the expression levels of the corresponding clinical features. The plots illustrate the distribution and density of feature values, highlighting differences between the 2 syndrome groups. AST/ALT: aspartate transaminase/alanine transaminase; CREA: creatinine; CRP: C-reactive protein; GLO: globulin; IBIL: unconjugated bilirubin; NEU%: neutrophil percentage; ns: not significant; PCT: thrombocytocrit; RDW-SD: red cell distribution width-SD; T: temperature; TBIL: total bilirubin; TCHO: total cholesterol; WBC: white blood cell; *<italic>P</italic>&#x003C;.05, **<italic>P</italic>&#x003C;.01 versus the cold.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64725_fig07.png"/></fig></sec><sec id="s3-5"><title>Interactive Web Server</title><p>To enhance user experience, an interactive web server named ACHVP was developed in this study, allowing users to test, explore, and experience the proposed method. The platform is designed to be highly convenient and user-friendly&#x2014;users simply input relevant numerical data into designated textboxes and click the &#x201C;Submit&#x201D; button. The system then performs comprehensive data processing and analysis, presenting the predicted syndrome classification results on the output interface. The home page of the web server, developed for identifying cold and hot syndrome patterns in patients with viral pneumonia, is illustrated in <xref ref-type="fig" rid="figure8">Figure 8</xref>. The server is deployed in a Linux environment. The backend is developed in Python using the FastAPI framework to ensure efficient data processing and application programming interface management, while the front end is built with JavaScript and the Vue.js framework for a responsive and interactive user interface. Users can access the web server via any standard web browser, such as Google Chrome, Mozilla Firefox, or Safari, using the link specified in [<xref ref-type="bibr" rid="ref34">34</xref>]. This web-based tool demonstrates significant potential as a practical diagnostic aid, facilitating early detection of cold and hot syndromes in patients with viral pneumonia. It can support TCM practitioners in syndrome differentiation and guide more precise Chinese herbal medicine prescriptions in clinical practice.</p><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>Web server of the ACHVP method.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64725_fig08.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Dialectical treatment is a fundamental principle in TCM for diagnosing and treating diseases, with cold and hot syndromes serving as 2 key components for identifying the nature of illness [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref35">35</xref>-<xref ref-type="bibr" rid="ref38">38</xref>]. In recent years, the study of TCM cold and hot syndrome has become a focal point in disease research. Numerous studies have shown that cold and hot syndromes also exhibit major TCM diagnostic patterns in various viral pulmonary diseases, including COVID-19 and SARS [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Based on these syndrome classifications, TCM has demonstrated a prominent role in alleviating symptoms, shortening treatment duration, and reducing the progression to severe pneumonia in patients with viral pneumonia [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref43">43</xref>]. For example, formulas such as Hanshiyi for cold syndrome [<xref ref-type="bibr" rid="ref44">44</xref>] and Jinhua Qinggan Granules for hot syndrome have shown favorable clinical efficacy [<xref ref-type="bibr" rid="ref45">45</xref>]. Therefore, the rapid, accurate, and specific identification of cold or hold syndrome is essential for the effective application of TCM in the treatment of viral pulmonary diseases. However, the abstract and complex nature of TCM syndrome differentiation poses challenges in accurately distinguishing between cold and hot syndromes in clinical practice. Machine learning offers a promising solution to this challenge by supporting clinicians in syndrome differentiation and facilitating more precise treatment decisions. Consequently, there is an urgent need to integrate TCM theories of cold and hot syndromes with modern laboratory diagnostics and machine learning approaches to advance the modernized differentiation and treatment of viral pneumonia.</p><p>In this study, 8 machine learning algorithms were applied to develop and evaluate a model for differentiating TCM cold and hot syndromes in viral pneumonia, using clinical data from 1484 patients across 2 medical centers. Among the models incorporating both TCM and modern medical features, the GBM model demonstrated superior learning capability, achieving an AUC of 0.8329. This indicates that GBM was particularly effective in distinguishing cold and hot syndromes based on a given dataset. The &#x201C;feature importance&#x201D; method of the GBM model was subsequently used to rank all features, from which the top 13 features were selected based on the highest AUC value. To validate the model&#x2019;s effectiveness and generalizability, both internal and external test sets were used, each demonstrating strong discriminatory performance. As a result, the optimal model was constructed using the GBM algorithm and 13 selected features (T, RDW-SD, CREA, TBIL, GLO, CRP, IBIL, WBC, NEU%, AST/ALT, TCHO, PCT, and AGE), achieving an AUC of 0.7788. These findings suggest that effectively combining modern medical indicators, primarily based on laboratory tests, with TCM features primarily based on clinical observation may offer a viable pathway toward the modernization of TCM syndrome differentiation. This approach provides a foundation for the objectification and standardization of TCM diagnostic practices. Furthermore, the proposed model holds promise as a practical tool to assist clinicians in accurately identifying cold and hot syndromes in viral pneumonia, thereby informing appropriate and individualized treatment strategies.</p></sec><sec id="s4-2"><title>Comparison With Prior Work</title><p>Machine learning, as an advanced artificial intelligence technology, has demonstrated broad potential in the field of &#x201C;artificial intelligence+TCM diagnoses.&#x201D; For example, Zhang et al [<xref ref-type="bibr" rid="ref46">46</xref>] proposed a comprehensive model using convolutional neural networks to classify 187 types of TCM diseases. Wen et al [<xref ref-type="bibr" rid="ref47">47</xref>] also applied deep neural networks to identify tongue image data and determine patients&#x2019; constitutions, effectively addressing the imbalance problem among constitution categories. However, limited research has focused on identifying TCM cold and hot syndromes in viral pneumonia by integrating both TCM theory and modern medicine through machine learning approaches. Although some scholars have attempted to explore the cold and hot attributes of diseases to guide clinical treatment, most studies have been limited to network analysis, clustering, or laboratory testing, without incorporating artificial intelligence methods. For instance, Li et al&#x2019;s [<xref ref-type="bibr" rid="ref11">11</xref>] network analysis revealed that the leptin biomarker indicated low levels of energy metabolism in patients with cold syndrome, while the human monocyte chemoattractant protein-1 (CCL2/MCP1) biomarker suggested intensified immune regulation in patients with hot syndrome, based on a study involving patients with chronic superficial gastritis and chronic atrophic gastritis. Wang et al [<xref ref-type="bibr" rid="ref13">13</xref>] differentiated heat and cold patterns in rheumatoid arthritis through cluster and factor analyses to guide clinical medication. Wu et al [<xref ref-type="bibr" rid="ref48">48</xref>] investigated TCM cold and hot constitutions using pulse wave parameters such as augmentation index and heart rate variability. Although some individual studies have applied artificial intelligence to differentiate cold and hot properties, most efforts have been limited to identifying the properties of Chinese herbal medicines. For example, Lin et al [<xref ref-type="bibr" rid="ref49">49</xref>] developed a classification strategy for the cold and hot properties of Chinese herbal medicines using artificial intelligence and biological experiments. Wei et al [<xref ref-type="bibr" rid="ref50">50</xref>] applied machine learning techniques to intelligently identify the cold-hot nature of Chinese herbal medicines based on the similarity of their volatile oil ingredients. Therefore, this study innovatively constructs a model for differentiating cold and hot syndromes in viral pneumonia using machine learning approaches that integrate TCM and modern medicine, aiming to assist in diagnosis and medication guidance for viral pneumonia in clinical practice.</p><p>It is worth noting that in this study, we collected a large number of clinical features, including patients&#x2019; symptoms, signs, laboratory examination results, and other relevant information, which were essential for training and testing the machine learning models. As shown in <xref ref-type="table" rid="table3">Table 3</xref>, based on the model training results using only 19 TCM features, we found that the AUC values of GBM, LR, RF, XGB, LGB, RIDGE, LASSO, and SVM were 0.6942, 0.6317, 0.6783, 0.6787, 0.6055, 0.6151, 0.6145, and 0.5874, respectively. Meanwhile, the study also attempted to build models using only 70 laboratory results. The AUC values for GBM, LR, RF, XGB, LGB, RIDGE, LASSO, and SVM were 0.6799, 0.6282, 0.6797, 0.6910, 0.7345, 0.6637, 0.6157, and 0.6618, respectively. Among them, the GBM model constructed using TCM features achieved an AUC of 0.6942, outperforming the GBM model constructed using laboratory features, which had an AUC of 0.6799. Internal validation and the confusion matrix results also demonstrated performance consistent with the training results, as shown in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. These findings suggest that the models possess auxiliary diagnostic value for differentiating TCM cold and hot syndromes in viral pneumonia.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Comparison of model results by 5-fold cross-validation based on different features of traditional Chinese medicine and modern medicine.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Features and evaluation</td><td align="left" valign="bottom">Gradient boosting machine</td><td align="left" valign="bottom">Logistic regression</td><td align="left" valign="bottom">Random forest</td><td align="left" valign="bottom">Extreme gradient boosting</td><td align="left" valign="bottom">Light gradient boosting machine</td><td align="left" valign="bottom">Ridge regression</td><td align="left" valign="bottom">Least absolute shrinkage and selection operator</td><td align="left" valign="bottom">Support vector machine</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="9">Traditional Chinese medicine</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Area under the curve</td><td align="char" char="." valign="top">0.6942</td><td align="char" char="." valign="top">0.6317</td><td align="char" char="." valign="top">0.6783</td><td align="char" char="." valign="top">0.6787</td><td align="char" char="." valign="top">0.6055</td><td align="char" char="." valign="top">0.6151</td><td align="char" char="." valign="top">0.6145</td><td align="char" char="." valign="top">0.5874</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Accuracy</td><td align="char" char="." valign="top">0.6851</td><td align="char" char="." valign="top">0.5312</td><td align="char" char="." valign="top">0.5509</td><td align="char" char="." valign="top">0.6031</td><td align="char" char="." valign="top">0.5155</td><td align="char" char="." valign="top">0.5180</td><td align="char" char="." valign="top">0.5049</td><td align="char" char="." valign="top">0.7508</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="char" char="." valign="top">0.7365</td><td align="char" char="." valign="top">0.4737</td><td align="char" char="." valign="top">0.5077</td><td align="char" char="." valign="top">0.5908</td><td align="char" char="." valign="top">0.4389</td><td align="char" char="." valign="top">0.4258</td><td align="char" char="." valign="top">0.4117</td><td align="char" char="." valign="top">0.9928</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="char" char="." valign="top">0.5804</td><td align="char" char="." valign="top">0.7316</td><td align="char" char="." valign="top">0.7457</td><td align="char" char="." valign="top">0.7006</td><td align="char" char="." valign="top">0.7233</td><td align="char" char="." valign="top">0.7854</td><td align="char" char="." valign="top">0.7723</td><td align="char" char="." valign="top">0.2601</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Matthews correlation coefficient</td><td align="char" char="." valign="top">0.2737</td><td align="char" char="." valign="top">0.1689</td><td align="char" char="." valign="top">0.2145</td><td align="char" char="." valign="top">0.2400</td><td align="char" char="." valign="top">0.1332</td><td align="char" char="." valign="top">0.1821</td><td align="char" char="." valign="top">0.1563</td><td align="char" char="." valign="top">0.2385</td></tr><tr><td align="left" valign="top" colspan="9">Modern medicine</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Area under the curve</td><td align="char" char="." valign="top">0.6799</td><td align="char" char="." valign="top">0.6282</td><td align="char" char="." valign="top">0.6797</td><td align="char" char="." valign="top">0.6910</td><td align="char" char="." valign="top">0.7345</td><td align="char" char="." valign="top">0.6637</td><td align="char" char="." valign="top">0.6157</td><td align="char" char="." valign="top">0.6618</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Accuracy</td><td align="char" char="." valign="top">0.7508</td><td align="char" char="." valign="top">0.7508</td><td align="char" char="." valign="top">0.7541</td><td align="char" char="." valign="top">0.7672</td><td align="char" char="." valign="top">0.7803</td><td align="char" char="." valign="top">0.7639</td><td align="char" char="." valign="top">0.7180</td><td align="char" char="." valign="top">0.7639</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="char" char="." valign="top">0.9441</td><td align="char" char="." valign="top">0.9185</td><td align="char" char="." valign="top">0.9742</td><td align="char" char="." valign="top">0.9400</td><td align="char" char="." valign="top">0.9314</td><td align="char" char="." valign="top">0.8968</td><td align="char" char="." valign="top">0.8539</td><td align="char" char="." valign="top">1.0000</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="char" char="." valign="top">0.1257</td><td align="char" char="." valign="top">0.2105</td><td align="char" char="." valign="top">0.0410</td><td align="char" char="." valign="top">0.2067</td><td align="char" char="." valign="top">0.2914</td><td align="char" char="." valign="top">0.3324</td><td align="char" char="." valign="top">0.2762</td><td align="char" char="." valign="top">0.0000</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Matthews correlation coefficient</td><td align="char" char="." valign="top">0.1269</td><td align="char" char="." valign="top">0.1585</td><td align="char" char="." valign="top">0.0335</td><td align="char" char="." valign="top">0.1927</td><td align="char" char="." valign="top">0.2871</td><td align="char" char="." valign="top">0.2672</td><td align="char" char="." valign="top">0.1752</td><td align="char" char="." valign="top">0.0000</td></tr><tr><td align="left" valign="top" colspan="9">Traditional Chinese medicine and modern medicine</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Area under the curve</td><td align="char" char="." valign="top">0.8329</td><td align="char" char="." valign="top">0.6477</td><td align="char" char="." valign="top">0.7272</td><td align="char" char="." valign="top">0.7546</td><td align="char" char="." valign="top">0.7693</td><td align="char" char="." valign="top">0.6970</td><td align="char" char="." valign="top">0.6974</td><td align="char" char="." valign="top">0.6514</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Accuracy</td><td align="char" char="." valign="top">0.8000</td><td align="char" char="." valign="top">0.6787</td><td align="char" char="." valign="top">0.6689</td><td align="char" char="." valign="top">0.6984</td><td align="char" char="." valign="top">0.7246</td><td align="char" char="." valign="top">0.7475</td><td align="char" char="." valign="top">0.7475</td><td align="char" char="." valign="top">0.4459</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity</td><td align="char" char="." valign="top">0.8283</td><td align="char" char="." valign="top">0.7365</td><td align="char" char="." valign="top">0.6582</td><td align="char" char="." valign="top">0.7172</td><td align="char" char="." valign="top">0.7158</td><td align="char" char="." valign="top">0.8388</td><td align="char" char="." valign="top">0.8430</td><td align="char" char="." valign="top">0.2975</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="char" char="." valign="top">0.7016</td><td align="char" char="." valign="top">0.5187</td><td align="char" char="." valign="top">0.7066</td><td align="char" char="." valign="top">0.6326</td><td align="char" char="." valign="top">0.7327</td><td align="char" char="." valign="top">0.4764</td><td align="char" char="." valign="top">0.4656</td><td align="char" char="." valign="top">0.9018</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Matthews correlation coefficient</td><td align="char" char="." valign="top">0.5043</td><td align="char" char="." valign="top">0.2341</td><td align="char" char="." valign="top">0.3190</td><td align="char" char="." valign="top">0.3177</td><td align="char" char="." valign="top">0.4068</td><td align="char" char="." valign="top">0.3364</td><td align="char" char="." valign="top">0.3407</td><td align="char" char="." valign="top">0.2161</td></tr></tbody></table></table-wrap><p>Based on &#x201C;feature importance&#x201D; or &#x201C;coef,&#x201D; the 8 models were further used to evaluate the significance of TCM features in distinguishing cold and hot syndromes of viral pneumonia. We found that, according to the significance values, there were 7 common features with importance values equal to or greater than the median in the GBM, RF, XGB, and LGB models, namely, fatigue, sore throat, fever, expectoration, cough, body pain, and diminished sense of smell. Interestingly, sore throat and fever also appeared among the features with importance values equal to or greater than the median in LR, RIDGE, LASSO, and SVM models. Based on this, we believe that fatigue, sore throat, fever, expectoration, cough, body pain, and diminished sense of smell may be the primary distinguishing factors for differentiating between cold and hot syndromes in the TCM diagnosis of viral pneumonia, which aligns with the key symptomatology commonly used by clinical TCM practitioners [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref52">52</xref>]. Therefore, more attention should be given to these features, especially sore throat and fever, in the discrimination of cold and hot syndromes in viral pneumonia, as shown in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. Unfortunately, the AUC values of these models did not exceed 0.7. We boldly speculate that this might be due to the quantification of TCM features not aligning with modern medical standards. Specifically, TCM features lack precise numerical values and are typically categorized as none, mild, moderate, or severe. Moreover, the identification of TCM features primarily relies on the subjective judgment of TCM practitioners and years of clinical experience, leading to a lack of standardization and objectivity. These factors may introduce noise and reduce the effectiveness of model training. Therefore, it is essential to develop objective indicators for TCM syndrome differentiation, further supporting the original intent of our study. In subsequent experiments, we integrated modern medicine features with TCM indicators and were pleasantly surprised to find that, compared with models trained solely on TCM features, those based on integrated TCM and modern medical features demonstrated superior performance in distinguishing cold and hot syndromes in viral pneumonia across 8 machine learning algorithms. This suggests that modern medical features can enhance the predictive value of TCM features.</p><p>In addition, the best model we developed indicated that the identification of cold and hot syndromes in viral pneumonia is closely related to 13 features: temperature, RDW-SD, CREA, TBIL, GLO, CRP, IBIL, WBC, NEU%, AST/ALT, TCHO, PCT, and AGE. Numerous studies have reported that temperature (T), CRP, and WBC hold statistical significance in distinguishing TCM cold and hot syndromes in rheumatoid arthritis [<xref ref-type="bibr" rid="ref53">53</xref>]. Furthermore, features such as AGE, NEU%, RDW-SD, and CRP are strongly associated with the severity of viral pneumonia and the development of chronic lung sequelae. For example, a study by Liu et al [<xref ref-type="bibr" rid="ref33">33</xref>] suggested that AGE and NEU% could serve as predictive factors for the severity of viral pneumonia. Shen et al [<xref ref-type="bibr" rid="ref31">31</xref>] also reported that RDW-SD is a key indicator for assessing the severity of viral pneumonia. Additionally, CRP and AGE play crucial roles in the diagnosis of viral pneumonia [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>], which is consistent with the findings of this study.</p></sec><sec id="s4-3"><title>Limitations</title><p>The accuracy of traditional TCM diagnosis of cold and hot syndromes largely depends on the skills and years of clinical experience of the practitioner. Subjective factors play a decisive role in this process. Compared with traditional TCM methods, the model developed in this study offers a more objective approach to differentiating cold and hot syndromes in viral pneumonia. It provides valuable decision support and medication guidance in clinical practice, especially for practitioners with limited TCM experience. This shift toward an objective, data-driven approach helps reduce reliance on subjective judgment, improves diagnostic accuracy, and ensures greater consistency in clinical decision-making. Additionally, the model can serve as a practical tool for TCM practitioners, especially in complex cases where traditional diagnostic methods may fall short.</p><p>Of course, this study has some limitations. First, it was a retrospective study, and all patient history data were obtained from the internal electronic medical record systems of the Second People&#x2019;s Hospital of Lanzhou and Lanzhou Heavy Ion Hospital. This may have introduced inaccuracies in the collection and recording of medical history, making it difficult to avoid information bias. Moreover, due to the limited clinical sample size, the conclusions, although statistically sound, require further validation and refinement in real-world applications to enhance the model&#x2019;s accuracy and stability.</p><p>In recent years, emerging large language models (LLMs) have demonstrated remarkable capabilities in natural language processing, knowledge integration, and complex reasoning [<xref ref-type="bibr" rid="ref56">56</xref>]. Given the nature of TCM theory, which often involves complex textual descriptions and implicit knowledge, LLMs could potentially offer new perspectives for model development in this study. These models may better understand and integrate the rich, diverse information contained in TCM literature, clinical records, and expert knowledge, thereby enriching the feature set and enhancing the interpretability of the models. For instance, LLMs could analyze the semantic relationships among TCM symptoms, syndromes, and treatment methods, helping to extract more meaningful features that may be difficult to identify using traditional machine learning approaches. Moreover, LLMs could assist in standardizing and structuring the subjective and qualitative information in TCM, thereby reducing the impact of inconsistent data representation. However, applying LLMs also poses challenges, such as ensuring the reliability of the extracted knowledge, addressing potential biases inherent in pretrained models, and efficiently integrating LLM-derived features with existing laboratory test data. In future work, we plan to collect more data to establish a local database and explore the integration of LLMs with traditional machine learning algorithms. By fully leveraging the advantages of both approaches, we aim to further enhance the performance of the TCM cold and hot syndrome differentiation model and advance the modernization and standardization of TCM diagnosis.</p></sec><sec id="s4-4"><title>Conclusion</title><p>This study aimed to establish a differentiation model for TCM cold and hot syndromes in patients with viral pneumonia using machine learning by exploring correlations between cold/hot syndromes and features from both TCM and modern medicine (such as general information, TCM characteristics, blood gas values, viral pneumonia indicators, biochemical indicators, routine blood test indicators, and coagulation indicators). We found that machine learning algorithms based on integrated TCM and modern medicine features outperformed models that used only TCM or only modern medicine features. Specifically, a model composed of 13 optimal features (T, RDW-SD, CREA, TBIL, GLO, CRP, IBIL, WBC, NEU%, AST/ALT, TCHO, PCT, and AGE) and the GBM algorithm effectively differentiated TCM syndromes. This study is the first to integrate the TCM cold and hot syndrome theory with laboratory-based modern medical tests using machine learning. By establishing the relationship between TCM syndrome theory (cold and hot syndromes) and indicators from both TCM and modern medicine, we aim to provide a new auxiliary diagnostic method for the clinical differentiation of cold and hot syndromes. This can support practitioners in making comprehensive diagnoses and identifying effective Chinese herbal medicine treatments, while also offering new insights for the modernization and scientific interpretation of TCM syndrome differentiation theory to guide treatment.</p></sec></sec></body><back><ack><p>This study was supported by the Major Science and Technology Project of Gansu Province (grant 22ZD1FA001), the Provincial University Industry Support Project in Gansu (grant 2020C-36), the Young Elite Scientists Sponsorship Program by the Gansu Association for Science and Technology (grant GXH20210611-02), and the 2023 Longyuan Youth Innovation and Entrepreneurship Talent Project (Gan Group Tong Zi [2023] No. 20).</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated in this study are not publicly available due to hospital institutional review board regulations and patient privacy policies, but deidentified datasets are available from the corresponding author (YL) upon reasonable request. These deidentified datasets would include the model training set and the test set to facilitate independent model replications.</p></sec></notes><fn-group><fn fn-type="con"><p>XJ was responsible for formal analysis, investigation, project administration, writing the original draft, and reviewing and editing the manuscript. YW and JW contributed to the investigation, methodology, resources, supervision, validation, writing the original draft, and reviewing and editing. YH and QG were involved in formal analysis, investigation, methodology, writing the original draft, and reviewing and editing. LS and JZ participated in the investigation and methodology. JL, LL, and ZZ contributed to the investigation, methodology, resources, and supervision. SL was responsible for conceptualization, methodology, project administration, and reviewing and editing the manuscript. YL contributed to conceptualization, formal analysis, methodology, supervision, and reviewing and editing. All authors have read and approved the final manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ACC</term><def><p>accuracy</p></def></def-item><def-item><term id="abb2">ALT</term><def><p>alanine transaminase</p></def></def-item><def-item><term id="abb3">AST</term><def><p>aspartate transaminase</p></def></def-item><def-item><term id="abb4">AUC</term><def><p>area under the curve</p></def></def-item><def-item><term id="abb5">CREA</term><def><p>creatinine</p></def></def-item><def-item><term id="abb6">CRP</term><def><p>C-reactive protein</p></def></def-item><def-item><term id="abb7">FN</term><def><p>false negative</p></def></def-item><def-item><term id="abb8">FP</term><def><p>false positive</p></def></def-item><def-item><term id="abb9">GBM</term><def><p>gradient boosting machine</p></def></def-item><def-item><term id="abb10">GLO</term><def><p>globulin</p></def></def-item><def-item><term id="abb11">IBIL</term><def><p>unconjugated bilirubin</p></def></def-item><def-item><term id="abb12">LASSO</term><def><p>least absolute shrinkage and selection operator</p></def></def-item><def-item><term id="abb13">LGB</term><def><p>light gradient boosting machine</p></def></def-item><def-item><term id="abb14">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb15">LR</term><def><p>logistic regression</p></def></def-item><def-item><term id="abb16">MCC</term><def><p>Matthews correlation coefficient</p></def></def-item><def-item><term id="abb17">nCovORF1ab</term><def><p>Na, ORF1ab gene of novel coronavirus by nose test</p></def></def-item><def-item><term id="abb18">NEU%</term><def><p>neutrophil percentage</p></def></def-item><def-item><term id="abb19">PCT</term><def><p>thrombocytocrit</p></def></def-item><def-item><term id="abb20">RDW</term><def><p>red cell distribution width</p></def></def-item><def-item><term id="abb21">RF</term><def><p>random forest</p></def></def-item><def-item><term id="abb22">RIDGE</term><def><p>ridge regression</p></def></def-item><def-item><term id="abb23">SaO<sub>2</sub></term><def><p>oxygen saturation under load</p></def></def-item><def-item><term id="abb24">SEN</term><def><p>sensitivity</p></def></def-item><def-item><term id="abb25">SHAP</term><def><p>Shapley additive explanations</p></def></def-item><def-item><term id="abb26">SPE</term><def><p>specificity</p></def></def-item><def-item><term id="abb27">SVM</term><def><p>support vector machine</p></def></def-item><def-item><term id="abb28">T</term><def><p>temperature</p></def></def-item><def-item><term id="abb29">TBIL</term><def><p>total bilirubin</p></def></def-item><def-item><term id="abb30">TCHO</term><def><p>total cholesterol</p></def></def-item><def-item><term id="abb31">TCM</term><def><p>traditional Chinese medicine</p></def></def-item><def-item><term id="abb32">TN</term><def><p>true negative</p></def></def-item><def-item><term id="abb33">TP</term><def><p>true positive</p></def></def-item><def-item><term id="abb34">WBC</term><def><p>white blood cell</p></def></def-item><def-item><term id="abb35">XGB</term><def><p>extreme gradient boosting</p></def></def-item><def-item><term id="abb36">XGB</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gan</surname><given-names>X</given-names> </name><name name-style="western"><surname>Shu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Network medicine framework reveals generic herb-symptom effectiveness of traditional Chinese medicine</article-title><source>Sci Adv</source><year>2023</year><month>10</month><day>27</day><volume>9</volume><issue>43</issue><fpage>eadh0215</fpage><pub-id pub-id-type="doi">10.1126/sciadv.adh0215</pub-id><pub-id pub-id-type="medline">37889962</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dong</surname><given-names>J</given-names> </name></person-group><article-title>The relationship between traditional Chinese medicine and modern medicine</article-title><source>Evid Based Complement Alternat Med</source><year>2013</year><volume>2013</volume><fpage>153148</fpage><pub-id pub-id-type="doi">10.1155/2013/153148</pub-id><pub-id pub-id-type="medline">23983772</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>W</given-names> </name></person-group><article-title>Traditional Chinese medicine Tongxie Yaofang treating irritable bowel syndrome with diarrhea and type 2 diabetes mellitus in rats with liver-depression and spleen-deficiency: a preliminary study</article-title><source>Front Nutr</source><year>2022</year><volume>9</volume><fpage>968930</fpage><pub-id pub-id-type="doi">10.3389/fnut.2022.968930</pub-id><pub-id pub-id-type="medline">36438735</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Song</surname><given-names>YN</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>FF</given-names> </name><etal/></person-group><article-title>A metabolic mechanism analysis of Fuzheng-Huayu formula for improving liver cirrhosis with traditional Chinese medicine syndromes</article-title><source>Acta Pharmacol Sin</source><year>2018</year><month>06</month><volume>39</volume><issue>6</issue><fpage>942</fpage><lpage>951</lpage><pub-id pub-id-type="doi">10.1038/aps.2017.101</pub-id><pub-id pub-id-type="medline">29072258</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>To study the protective effect of Huangqi Baihe granules on radiation brain injury based on network pharmacology and experiment</article-title><source>J Ethnopharmacol</source><year>2023</year><month>10</month><volume>315</volume><fpage>116610</fpage><pub-id pub-id-type="doi">10.1016/j.jep.2023.116610</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>P</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Traditional Chinese medicine (TCM) in the treatment of COVID-19 and other viral infections: efficacies and mechanisms</article-title><source>Pharmacol Ther</source><year>2021</year><month>09</month><volume>225</volume><fpage>107843</fpage><pub-id pub-id-type="doi">10.1016/j.pharmthera.2021.107843</pub-id><pub-id pub-id-type="medline">33811957</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ni</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Combating COVID-19 with integrated traditional Chinese and Western medicine in China</article-title><source>Acta Pharm Sin B</source><year>2020</year><month>07</month><volume>10</volume><issue>7</issue><fpage>1149</fpage><lpage>1162</lpage><pub-id pub-id-type="doi">10.1016/j.apsb.2020.06.009</pub-id><pub-id pub-id-type="medline">32834946</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>W</given-names> </name><name name-style="western"><surname>He</surname><given-names>W</given-names> </name><name name-style="western"><surname>Xie</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name></person-group><article-title>Meta-analysis of single-group rate of the distribution of traditional Chinese medicine syndromes in 2 139 patients with coronavirus disease 2019</article-title><source>Zhonghua Wei Zhong Bing Ji Jiu Yi Xue</source><year>2020</year><month>06</month><volume>32</volume><issue>6</issue><fpage>664</fpage><lpage>670</lpage><pub-id pub-id-type="doi">10.3760/cma.j.cn121430-202000509-00372</pub-id><pub-id pub-id-type="medline">32684209</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>SC</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>YQ</given-names> </name><name name-style="western"><surname>Bian</surname><given-names>GB</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>R</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>MQ</given-names> </name></person-group><article-title>Clinical study on Qingfei oral liquid treating 507 cases of phlegm-heat obstructing lung syndrome in children virus pneumonia</article-title><source>World Chin Med</source><year>2016</year><volume>11</volume><issue>9</issue><fpage>1649</fpage><lpage>1653, 1658</lpage><pub-id pub-id-type="doi">10.3969/j.issn.1673-7202.2016.09.001</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Deng</surname><given-names>TT</given-names> </name></person-group><article-title>A discussion on diagnosis and treatment of SARS by traditional Chinese medicine</article-title><source>New Chin Med</source><year>2003</year><issue>6</issue><fpage>3</fpage><lpage>5</lpage><pub-id pub-id-type="doi">10.13457/j.cnki.jncm.2003.06.001</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>T</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Li</surname><given-names>S</given-names> </name></person-group><article-title>Imbalanced network biomarkers for traditional Chinese medicine syndrome in gastritis patients</article-title><source>Sci Rep</source><year>2013</year><volume>3</volume><fpage>1543</fpage><pub-id pub-id-type="doi">10.1038/srep01543</pub-id><pub-id pub-id-type="medline">23529020</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>N</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Integrating strategies of chemistry, biochemistry and metabolomics for characterization of the medication principle of &#x201C;treating cold/heat syndrome with hot/cold herbs&#x201D;</article-title><source>J Ethnopharmacol</source><year>2019</year><month>07</month><day>15</day><volume>239</volume><fpage>111899</fpage><pub-id pub-id-type="doi">10.1016/j.jep.2019.111899</pub-id><pub-id pub-id-type="medline">31039429</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Guan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name></person-group><article-title>Rheumatoid arthritis characteristics and classification of heat and cold patterns&#x2013;an observational study</article-title><source>Heliyon</source><year>2023</year><month>02</month><volume>9</volume><issue>2</issue><fpage>e13439</fpage><pub-id pub-id-type="doi">10.1016/j.heliyon.2023.e13439</pub-id><pub-id pub-id-type="medline">36873147</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feng</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Xie</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Chun</surname><given-names>L</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name></person-group><article-title>Study on traditional Chinese medicine common syndrome characteristic of coronavirus disease 2019 based on latent structure combined with system clustering analysis</article-title><source>Zhonghua Wei Zhong Bing Ji Jiu Yi Xue</source><year>2020</year><month>05</month><volume>32</volume><issue>5</issue><fpage>537</fpage><lpage>543</lpage><pub-id pub-id-type="doi">10.3760/cma.j.cn121430-20200506-00620</pub-id><pub-id pub-id-type="medline">32576343</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>L</given-names> </name><etal/></person-group><article-title>GC discrimination: identification of gastric cancer based on a milliliter of blood</article-title><source>Brief Bioinformatics</source><year>2021</year><month>01</month><day>18</day><volume>22</volume><issue>1</issue><fpage>536</fpage><lpage>544</lpage><pub-id pub-id-type="doi">10.1093/bib/bbaa006</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jain</surname><given-names>P</given-names> </name><name name-style="western"><surname>Yedukondalu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chhabra</surname><given-names>H</given-names> </name><name name-style="western"><surname>Chauhan</surname><given-names>U</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>LD</given-names> </name></person-group><article-title>EEG-based detection of cognitive load using VMD and LightGBM classifier</article-title><source>Int J Mach Learn Cyber</source><year>2024</year><month>09</month><volume>15</volume><issue>9</issue><fpage>4193</fpage><lpage>4210</lpage><pub-id pub-id-type="doi">10.1007/s13042-024-02142-2</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Panda</surname><given-names>P</given-names> </name><name name-style="western"><surname>Bisoy</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Panigrahi</surname><given-names>A</given-names> </name><etal/></person-group><article-title>BIMSSA: enhancing cancer prediction with salp swarm optimization and ensemble machine learning approaches</article-title><source>Front Genet</source><year>2025</year><month>01</month><day>6</day><volume>15</volume><fpage>1491602</fpage><pub-id pub-id-type="doi">10.3389/fgene.2024.1491602</pub-id><pub-id pub-id-type="medline">39834551</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Houkan</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sahoo</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Gochhayat</surname><given-names>SP</given-names> </name><etal/></person-group><article-title>Enhancing security in industrial IoT networks: machine learning solutions for feature selection and reduction</article-title><source>IEEE Access</source><year>2024</year><volume>12</volume><fpage>160864</fpage><lpage>160883</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2024.3481459</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>WT</given-names> </name><name name-style="western"><surname>Hung</surname><given-names>HH</given-names> </name><name name-style="western"><surname>Kao</surname><given-names>YW</given-names> </name><etal/></person-group><article-title>Application of neural network and cluster analyses to differentiate TCM patterns in patients with breast cancer</article-title><source>Front Pharmacol</source><year>2020</year><volume>11</volume><fpage>670</fpage><pub-id pub-id-type="doi">10.3389/fphar.2020.00670</pub-id><pub-id pub-id-type="medline">32457636</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhuo</surname><given-names>YY</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Kuang</surname><given-names>L</given-names> </name><etal/></person-group><article-title>The discriminative efficacy of retinal characteristics on two traditional Chinese syndromes in association with ischemic stroke</article-title><source>Evid Based Complement Alternat Med</source><year>2020</year><volume>2020</volume><fpage>6051831</fpage><pub-id pub-id-type="doi">10.1155/2020/6051831</pub-id><pub-id pub-id-type="medline">32308711</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kwon</surname><given-names>O</given-names> </name><name name-style="western"><surname>Na</surname><given-names>W</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Electronic medical record-based machine learning approach to predict the risk of 30-day adverse cardiac events after invasive coronary treatment: machine learning model development and validation</article-title><source>JMIR Med Inform</source><year>2022</year><month>05</month><day>11</day><access-date>2025-06-24</access-date><volume>10</volume><issue>5</issue><fpage>e26801</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/2022/5/e26801/">https://medinform.jmir.org/2022/5/e26801/</ext-link></comment><pub-id pub-id-type="doi">10.2196/26801</pub-id><pub-id pub-id-type="medline">35544292</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name><name name-style="western"><surname>Park</surname><given-names>J</given-names> </name><name name-style="western"><surname>Son</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Development and validation of a machine learning algorithm for predicting diabetes retinopathy in patients with type 2 diabetes: algorithm development study</article-title><source>JMIR Med Inform</source><year>2025</year><month>02</month><day>7</day><access-date>2025-06-24</access-date><volume>13</volume><fpage>e58107</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/2025/1/e58107">https://medinform.jmir.org/2025/1/e58107</ext-link></comment><pub-id pub-id-type="doi">10.2196/58107</pub-id><pub-id pub-id-type="medline">39924304</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>X</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Machine learning-based risk factor analysis and prediction model construction for the occurrence of chronic heart failure: health ecologic study</article-title><source>JMIR Med Inform</source><year>2025</year><month>01</month><day>31</day><access-date>2025-06-24</access-date><volume>13</volume><fpage>e64972</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/2025/1/e64972">https://medinform.jmir.org/2025/1/e64972</ext-link></comment><pub-id pub-id-type="doi">10.2196/64972</pub-id><pub-id pub-id-type="medline">39889299</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>H</given-names> </name><name name-style="western"><surname>Nan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kong</surname><given-names>X</given-names> </name><name name-style="western"><surname>Duan</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>H</given-names> </name></person-group><article-title>Dealing with missing, imbalanced, and sparse features during the development of a prediction model for sudden death using emergency medicine data: machine learning approach</article-title><source>JMIR Med Inform</source><year>2023</year><month>01</month><day>20</day><access-date>2025-06-24</access-date><volume>11</volume><fpage>e38590</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/2023/1/e38590">https://medinform.jmir.org/2023/1/e38590</ext-link></comment><pub-id pub-id-type="doi">10.2196/38590</pub-id><pub-id pub-id-type="medline">36662548</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>He</surname><given-names>JC</given-names> </name></person-group><source>TCM Diagnostics [Book in Chinese]</source><year>2017</year><publisher-name>People&#x2019;s Medical Publishing House</publisher-name><pub-id pub-id-type="other">978-7-117-23280-7</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>XY</given-names> </name></person-group><source>Guiding Principle of Clinical Research on New Drugs of Traditional Chinese Medicine (Trial)</source><year>2002</year><publisher-name>China Medical Science and Technology Press</publisher-name><pub-id pub-id-type="other">750672586X</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Friedman</surname><given-names>JH</given-names> </name></person-group><article-title>Greedy function approximation: a gradient boosting machine</article-title><source>Ann Statist</source><year>2001</year><volume>29</volume><issue>5</issue><fpage>44</fpage><pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>J</given-names> </name></person-group><article-title>A frequency-adaptive multi-objective suspension control strategy</article-title><source>J Dyn Syst Meas Control</source><year>2004</year><month>09</month><day>1</day><volume>126</volume><issue>3</issue><fpage>700</fpage><lpage>707</lpage><pub-id pub-id-type="doi">10.1115/1.1789979</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goplen</surname><given-names>NP</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Son</surname><given-names>YM</given-names> </name><etal/></person-group><article-title>Tissue-resident CD8<sup>+</sup> T cells drive age-associated chronic lung sequelae after viral pneumonia</article-title><source>Sci Immunol</source><year>2020</year><month>11</month><day>6</day><volume>5</volume><issue>53</issue><fpage>eabc4557</fpage><pub-id pub-id-type="doi">10.1126/sciimmunol.abc4557</pub-id><pub-id pub-id-type="medline">33158975</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nie</surname><given-names>X</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Mortality prediction in cerebral hemorrhage patients using machine learning algorithms in intensive care units</article-title><source>Front Neurol</source><year>2020</year><volume>11</volume><fpage>610531</fpage><pub-id pub-id-type="doi">10.3389/fneur.2020.610531</pub-id><pub-id pub-id-type="medline">33551969</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Di</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Value of red blood cell distribution width in evaluating the severity of illness of novel coronavirus Delta variant</article-title><source>Zhonghua Wei Zhong Bing Ji Jiu Yi Xue</source><year>2022</year><month>05</month><volume>34</volume><issue>5</issue><fpage>475</fpage><lpage>480</lpage><pub-id pub-id-type="doi">10.3760/cma.j.cn121430-20220214-00127</pub-id><pub-id pub-id-type="medline">35728847</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Castro-Castro</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Garc&#x00ED;a-Tejada</surname><given-names>L</given-names> </name><name name-style="western"><surname>Arbiol-Roca</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Dynamic profiles and predictive values of some biochemical and haematological quantities in COVID-19 inpatients</article-title><source>Biochem Med (Zagreb)</source><year>2022</year><month>02</month><day>15</day><volume>32</volume><issue>1</issue><fpage>010706</fpage><pub-id pub-id-type="doi">10.11613/BM.2022.010706</pub-id><pub-id pub-id-type="medline">35210926</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Clinical and biochemical indexes from 2019-nCoV infected patients linked to viral loads and lung injury</article-title><source>Sci China Life Sci</source><year>2020</year><month>03</month><volume>63</volume><issue>3</issue><fpage>364</fpage><lpage>374</lpage><pub-id pub-id-type="doi">10.1007/s11427-020-1643-8</pub-id><pub-id pub-id-type="medline">32048163</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="web"><article-title>ACHVP</article-title><source>CPPDD</source><access-date>2025-06-12</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://cppdd.cn:9999/#/service/ACHVP">http://cppdd.cn:9999/#/service/ACHVP</ext-link></comment></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>M</given-names> </name><etal/></person-group><article-title>UHPLC/Q-TOFMS-based metabolomics for the characterization of cold and hot properties of Chinese materia medica</article-title><source>J Ethnopharmacol</source><year>2016</year><month>02</month><volume>179</volume><fpage>234</fpage><lpage>242</lpage><pub-id pub-id-type="doi">10.1016/j.jep.2015.12.061</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Li</surname><given-names>L</given-names> </name><name name-style="western"><surname>Song</surname><given-names>M</given-names> </name><name name-style="western"><surname>Yan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Shi</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yao</surname><given-names>Y</given-names> </name></person-group><article-title>Evaluating the traditional Chinese medicine (TCM) officially recommended in China for COVID-19 using ontology-based side-effect prediction framework (OSPF) and deep learning</article-title><source>J Ethnopharmacol</source><year>2021</year><month>05</month><volume>272</volume><fpage>113957</fpage><pub-id pub-id-type="doi">10.1016/j.jep.2021.113957</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xia</surname><given-names>F</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wan</surname><given-names>JB</given-names> </name></person-group><article-title>Characterization of the cold and hot natures of raw and processed Rehmanniae Radix by integrated metabolomics and network pharmacology</article-title><source>Phytomedicine</source><year>2020</year><month>08</month><volume>74</volume><fpage>153071</fpage><pub-id pub-id-type="doi">10.1016/j.phymed.2019.153071</pub-id><pub-id pub-id-type="medline">31537418</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ma</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>C</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ding</surname><given-names>W</given-names> </name><name name-style="western"><surname>Li</surname><given-names>S</given-names> </name></person-group><article-title>Bridging the gap between traditional Chinese medicine and systems biology: the connection of cold syndrome and NEI network</article-title><source>Mol Biosyst</source><year>2010</year><month>04</month><volume>6</volume><issue>4</issue><fpage>613</fpage><lpage>619</lpage><pub-id pub-id-type="doi">10.1039/b914024g</pub-id><pub-id pub-id-type="medline">20237638</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>X</given-names> </name><name name-style="western"><surname>Fan</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>Deciphering the active compounds and mechanisms of HSBDF for treating ALI via integrating chemical bioinformatics analysis</article-title><source>Front Pharmacol</source><year>2022</year><volume>13</volume><fpage>879268</fpage><pub-id pub-id-type="doi">10.3389/fphar.2022.879268</pub-id><pub-id pub-id-type="medline">35721141</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wei</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zeng</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Precise investigation of the efficacy of multicomponent drugs against pneumonia infected with influenza virus</article-title><source>Front Pharmacol</source><year>2021</year><volume>12</volume><fpage>604009</fpage><pub-id pub-id-type="doi">10.3389/fphar.2021.604009</pub-id><pub-id pub-id-type="medline">34867309</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>ZY</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>SZ</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Impact of Shenfu injection on a composite of organ dysfunction development in critically ill patients with coronavirus disease 2019 (COVID-19): a structured summary of a study protocol for a randomized controlled trial</article-title><source>Trials</source><year>2020</year><month>08</month><day>24</day><volume>21</volume><issue>1</issue><fpage>738</fpage><pub-id pub-id-type="doi">10.1186/s13063-020-04677-5</pub-id><pub-id pub-id-type="medline">32831151</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Dong</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Artificial intelligence-based preoperative prediction system for diagnosis and prognosis in epithelial ovarian cancer: a multicenter study</article-title><source>Front Oncol</source><year>2022</year><volume>12</volume><fpage>975703</fpage><pub-id pub-id-type="doi">10.3389/fonc.2022.975703</pub-id><pub-id pub-id-type="medline">36212430</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shi</surname><given-names>N</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Association between early treatment with Qingfei Paidu decoction and favorable clinical outcomes in patients with COVID-19: a retrospective multicenter cohort study</article-title><source>Pharmacol Res</source><year>2020</year><month>11</month><volume>161</volume><fpage>105290</fpage><pub-id pub-id-type="doi">10.1016/j.phrs.2020.105290</pub-id><pub-id pub-id-type="medline">33181320</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>D</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Understanding COVID-19 in Wuhan from the perspective of cold-dampness: clinical evidences and mechanisms</article-title><source>Front Med (Lausanne)</source><year>2021</year><volume>8</volume><fpage>617659</fpage><pub-id pub-id-type="doi">10.3389/fmed.2021.617659</pub-id><pub-id pub-id-type="medline">33693014</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lv</surname><given-names>JT</given-names> </name><name name-style="western"><surname>Sa</surname><given-names>RN</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>XM</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>ZJ</given-names> </name></person-group><article-title>The clinical benefits of Chinese patent medicines against COVID-19 based on current evidence</article-title><source>Pharmacol Res</source><year>2020</year><month>07</month><volume>157</volume><fpage>104882</fpage><pub-id pub-id-type="doi">10.1016/j.phrs.2020.104882</pub-id><pub-id pub-id-type="medline">32380051</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Ni</surname><given-names>W</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>J</given-names> </name></person-group><article-title>Artificial intelligence&#x2013;based traditional Chinese medicine assistive diagnostic system: validation study</article-title><source>JMIR Med Inform</source><year>2020</year><month>06</month><day>15</day><access-date>2025-06-24</access-date><volume>8</volume><issue>6</issue><fpage>e17608</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/2020/6/e17608/">https://medinform.jmir.org/2020/6/e17608/</ext-link></comment><pub-id pub-id-type="doi">10.2196/17608</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wen</surname><given-names>G</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>H</given-names> </name><name name-style="western"><surname>Jiang</surname><given-names>L</given-names> </name></person-group><article-title>Grouping attributes zero-shot learning for tongue constitution recognition</article-title><source>Artif Intell Med</source><year>2020</year><month>09</month><volume>109</volume><fpage>101951</fpage><pub-id pub-id-type="doi">10.1016/j.artmed.2020.101951</pub-id><pub-id pub-id-type="medline">34756217</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>HK</given-names> </name><name name-style="western"><surname>Ko</surname><given-names>YS</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>YS</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>HT</given-names> </name><name name-style="western"><surname>Tsai</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>HH</given-names> </name></person-group><article-title>The correlation between pulse diagnosis and constitution identification in traditional Chinese medicine</article-title><source>Complement Ther Med</source><year>2017</year><month>02</month><volume>30</volume><fpage>107</fpage><lpage>112</lpage><pub-id pub-id-type="doi">10.1016/j.ctim.2016.12.005</pub-id><pub-id pub-id-type="medline">28137520</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>P</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Identification strategy of cold and hot properties of Chinese herbal medicines based on artificial intelligence and biological experiments</article-title><source>Chin Med J</source><year>2025</year><volume>138</volume><issue>6</issue><fpage>745</fpage><lpage>747</lpage><pub-id pub-id-type="doi">10.1097/CM9.0000000000003509</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wei</surname><given-names>G</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>X</given-names> </name><name name-style="western"><surname>He</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Cold-hot nature identification based on GC similarity analysis of Chinese herbal medicine ingredients</article-title><source>RSC Adv</source><year>2021</year><month>07</month><day>27</day><volume>11</volume><issue>42</issue><fpage>26008</fpage><lpage>26015</lpage><pub-id pub-id-type="doi">10.1039/d1ra04189d</pub-id><pub-id pub-id-type="medline">35479454</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gu</surname><given-names>SF</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>ZX</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>L</given-names> </name><name name-style="western"><surname>Li</surname><given-names>MQ</given-names> </name></person-group><article-title>Clinical observation on the combination of traditional Chinese medicine Master Li Jiren&#x2019;s experience formula and olistavir in the treatment of viral pneumonia</article-title><source>GmjCM</source><year>2023</year><volume>38</volume><issue>8</issue><fpage>1550</fpage><lpage>1553</lpage><pub-id pub-id-type="doi">10.3969/j.issn.1003-8914.2023.08.041</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sun</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>Q</given-names> </name></person-group><article-title>The effects of Qingfei Paidu decoction on the time of disappearance of major symptoms, serum D-dimer levels, and erythrocyte sedimentation rate in patients with viral pneumonia</article-title><source>J Shenyang Pharm Univ</source><year>2021</year><volume>38</volume><issue>S2</issue><fpage>70</fpage><lpage>71</lpage></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>ZZ</given-names> </name><name name-style="western"><surname>Fang</surname><given-names>YF</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Logistic regression analysis of damp-heat and cold-damp impeding syndrome of rheumatoid arthritis: a perspective in Chinese medicine</article-title><source>Chin J Integr Med</source><year>2012</year><month>08</month><volume>18</volume><issue>8</issue><fpage>575</fpage><lpage>581</lpage><pub-id pub-id-type="doi">10.1007/s11655-012-1172-1</pub-id><pub-id pub-id-type="medline">22855033</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Qu</surname><given-names>JX</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Pu</surname><given-names>ZH</given-names> </name><etal/></person-group><article-title>Viral etiology of community-acquired pneumonia among adolescents and adults with mild or moderate severity and its relation to age and severity</article-title><source>BMC Infect Dis</source><year>2015</year><month>02</month><day>22</day><volume>15</volume><fpage>89</fpage><pub-id pub-id-type="doi">10.1186/s12879-015-0808-0</pub-id><pub-id pub-id-type="medline">25812108</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bekdas</surname><given-names>M</given-names> </name><name name-style="western"><surname>Goksugur</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Sarac</surname><given-names>EG</given-names> </name><name name-style="western"><surname>Erkocoglu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Demircioglu</surname><given-names>F</given-names> </name></person-group><article-title>Neutrophil/lymphocyte and C-reactive protein/mean platelet volume ratios in differentiating between viral and bacterial pneumonias and diagnosing early complications in children</article-title><source>Saudi Med J</source><year>2014</year><month>05</month><volume>35</volume><issue>5</issue><fpage>442</fpage><lpage>447</lpage><pub-id pub-id-type="medline">24825803</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhuang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Jiang</surname><given-names>N</given-names> </name><name name-style="western"><surname>Ge</surname><given-names>Y</given-names> </name></person-group><article-title>TCM-KLLaMA: Intelligent generation model for Traditional Chinese Medicine Prescriptions based on knowledge graph and large language model</article-title><source>Comput Biol Med</source><year>2025</year><month>05</month><volume>189</volume><fpage>109887</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2025.109887</pub-id><pub-id pub-id-type="medline">40056842</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>All clinical features information of patients with viral pneumonia.</p><media xlink:href="medinform_v13i1e64725_app1.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>The traditional Chinese medicine symptom scoring scale for patients with viral pneumonia.</p><media xlink:href="medinform_v13i1e64725_app2.docx" xlink:title="DOCX File, 19 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>The optimal features for the TCM cold and hot syndrome discrimination of viral pneumonia. AGE: age; AST/ALT: aspartate transaminase/alanine transaminase; CREA: creatinine; CRP: C-reactive protein; GLO: globulin; IBIL: unconjugated bilirubin; NEU%: neutrophil percentage; PCT: thrombocytocrit; RDW-SD: red cell distribution width-SD; T: temperature; TBIL: total bilirubin; TCHO: total cholesterol; WBC: white blood cell.</p><media xlink:href="medinform_v13i1e64725_app3.png" xlink:title="PNG File, 588 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>The performance evaluation of the cold and hot syndrome identification model based on traditional Chinese medicine (TCM) features. (A) The performance evaluation&#x2019;s radar chart of the 8 models based on TCM features. (B) The confusion matrix analysis of the 8 models based on TCM features.</p><media xlink:href="medinform_v13i1e64725_app4.docx" xlink:title="DOCX File, 351 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Heat diagram of traditional Chinese medicine features on 8 screened models (the values of gradient boosting machine, random forest, extreme gradient boosting, and light gradient boosting were obtained using feature importance, and those of ridge regression, least absolute shrinkage and selection operator, support vector machine, and logistic regression were obtained using coef).</p><media xlink:href="medinform_v13i1e64725_app5.docx" xlink:title="DOCX File, 1324 KB"/></supplementary-material></app-group></back></article>