<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn></journal-meta><article-meta><article-id pub-id-type="publisher-id">45523</article-id><article-id pub-id-type="doi">10.2196/45523</article-id><title-group><article-title>Establishment of a Public Mental Health Database for Research Purposes in the Ferrara Province: Development and Preliminary Evaluation Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Ferrara</surname><given-names>Maria</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gentili</surname><given-names>Elisabetta</given-names></name><degrees>MA</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Belvederi Murri</surname><given-names>Martino</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zese</surname><given-names>Riccardo</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name 
name-style="western"><surname>Alberti</surname><given-names>Marco</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Franchini</surname><given-names>Giorgia</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Domenicano</surname><given-names>Ilaria</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Folesani</surname><given-names>Federica</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sorio</surname><given-names>Cristina</given-names></name><degrees>MPH</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Benini</surname><given-names>Lorenzo</given-names></name><degrees>BA</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Carozza</surname><given-names>Paola</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Little</surname><given-names>Julian</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Grassi</surname><given-names>Luigi</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Institute of Psychiatry, Department of Neuroscience and Rehabilitation, University of Ferrara</institution>, <addr-line>Ferrara</addr-line>, 
<country>Italy</country></aff><aff id="aff2"><institution>Integrated Department of Mental Health and Pathological Addictions, Ferrara Local Health Trust</institution>, <addr-line>Ferrara</addr-line>, <country>Italy</country></aff><aff id="aff3"><institution>Department of Psychiatry, Yale School of Medicine</institution>, <addr-line>New Haven</addr-line>, <addr-line>CT</addr-line>, <country>United States</country></aff><aff id="aff4"><institution>Department of Engineering, University of Ferrara</institution>, <addr-line>Ferrara</addr-line>, <country>Italy</country></aff><aff id="aff5"><institution>Department of Chemical, Pharmaceutical and Agricultural Sciences, University of Ferrara</institution>, <addr-line>Ferrara</addr-line>, <country>Italy</country></aff><aff id="aff6"><institution>Department of Mathematics and Computer Science, University of Ferrara</institution>, <addr-line>Ferrara</addr-line>, <country>Italy</country></aff><aff id="aff7"><institution>Department of Physics, Informatics and Mathematics, University of Modena and Reggio Emilia</institution>, <addr-line>Modena</addr-line>, <country>Italy</country></aff><aff id="aff8"><institution>School of Epidemiology and Public Health, University of Ottawa</institution>, <addr-line>Ottawa</addr-line>, <addr-line>ON</addr-line>, <country>Canada</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Lovis</surname><given-names>Christian</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Mehta</surname><given-names>Nishita</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Maria Ferrara, MD, PhD<email>maria.ferrara@unife.it</email></corresp></author-notes><pub-date pub-type="collection"><year>2023</year></pub-date><pub-date pub-type="epub"><day>9</day><month>8</month><year>2023</year></pub-date><volume>11</volume><elocation-id>e45523</elocation-id><history><date 
date-type="received"><day>05</day><month>01</month><year>2023</year></date><date date-type="rev-recd"><day>04</day><month>05</month><year>2023</year></date><date date-type="accepted"><day>01</day><month>06</month><year>2023</year></date></history><copyright-statement>&#x00A9; Maria Ferrara, Elisabetta Gentili, Martino Belvederi Murri, Riccardo Zese, Marco Alberti, Giorgia Franchini, Ilaria Domenicano, Federica Folesani, Cristina Sorio, Lorenzo Benini, Paola Carozza, Julian Little, Luigi Grassi. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 09.08.2023. </copyright-statement><copyright-year>2023</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. 
The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2023/1/e45523"/><abstract><sec><title>Background</title><p>The immediate use of data exported from electronic health records (EHRs) for research is often limited by the necessity to transform data elements into an actual data set.</p></sec><sec><title>Objective</title><p>This paper describes the methodology for establishing a data set that originated from an EHR registry that included clinical, health service, and sociodemographic information.</p></sec><sec sec-type="methods"><title>Methods</title><p>The Extract, Transform, Load process was applied to raw data collected at the Integrated Department of Mental Health and Pathological Addictions in Ferrara, Italy, from 1925 to February 18, 2021, to build the new, anonymized Ferrara-Psychiatry (FEPSY) database. Information collected before the first EHR was implemented (ie, in 1991) was excluded. An unsupervised cluster analysis was performed to identify patient subgroups to support the proof of concept.</p></sec><sec sec-type="results"><title>Results</title><p>The FEPSY database included 3,861,432 records on 46,222 patients. Since 1991, each year, a median of 1404 (IQR 1117.5-1757.7) patients had newly accessed care, and a median of 7300 (IQR 6109.5-9397.5) patients were actively receiving care. 
Among 38,022 patients with a mental disorder, 2 clusters were identified; the first predominantly included male patients who were aged 25 to 34 years at first presentation and were living with their parents, and the second predominantly included female patients who were aged 35 to 44 years and were living with their own families.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The process for building the FEPSY database proved to be robust and replicable with similar health care data, even when they were not originally conceived for research purposes. The FEPSY database will enable future in-depth analyses regarding the epidemiology and social determinants of mental disorders, access to mental health care, and resource utilization.</p></sec></abstract><kwd-group><kwd>mental health</kwd><kwd>psychosis</kwd><kwd>epidemiology</kwd><kwd>electronic health registry</kwd><kwd>health care</kwd><kwd>machine learning</kwd><kwd>medical health records</kwd><kwd>electronic health records</kwd><kwd>clinical database</kwd><kwd>support</kwd><kwd>mental disorder</kwd><kwd>social determinants</kwd><kwd>mental health care</kwd><kwd>resource utilization</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Electronic health records (EHRs) assemble and enable access to large volumes of clinical and sociodemographic data that are routinely collected by local health authorities. EHRs offer a unique opportunity to conduct research on various topics, including, among others, the patterns of health care resource use and factors that influence the course and outcomes of mental disorders in large, representative samples [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. 
EHRs can be linked to data related to census and geolocalization information [<xref ref-type="bibr" rid="ref3">3</xref>]; such investigations span the epidemiology of mental disorders, hospitalization rates, morbidity, and mortality.</p><p>The breadth and nature of information represented in the sample of EHRs in the mental health sector make such information particularly suitable for using artificial intelligence (AI) and machine learning techniques, in addition to traditional methods (eg, linear regression models), in order to increase the potential for research on social and clinical factors [<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>Applications that use AI take advantage of AI's ability to process large amounts of data in order to extract information or identify underlying patterns of relationships that conventional methods may overlook [<xref ref-type="bibr" rid="ref5">5</xref>]. AI may be particularly suitable for the investigation of large amounts of clinical data, thanks to (1) the flexibility and scalability of AI techniques, which are higher than those of traditional methods, and (2) the ability of AI to consider all of the available predictors (ie, not only a subset), which makes AI and, in particular, machine learning suitable for performing tasks such as classification, prediction, and resource optimization [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>].</p><p>Indeed, in recent years, the use of AI techniques in mental health care research has rapidly increased, including its use to identify a disease at its earliest stages, predict illness onset in vulnerable individuals, study illness progression, optimize treatment, and discover novel therapeutic agents [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>As of yet, there are few examples (mainly from the United States) of how data collected from EHRs can be successfully adapted for analysis with AI. 
For example, Hughes et al [<xref ref-type="bibr" rid="ref9">9</xref>] analyzed clinical variables in the EHRs of 81,630 adults from 2 academic medical centers in Boston, Massachusetts (spanning 10 years) and identified predictors of treatment response for major depressive disorders.</p><p>Xu et al [<xref ref-type="bibr" rid="ref10">10</xref>] compiled a data set of 11,275 patients from 5 large medical centers across New York City by using EHR data collected between 2008 and 2017; they used machine learning methods to identify markers of depression phenotypes to inform clinical decisions about patients&#x2019; care. Pradier et al [<xref ref-type="bibr" rid="ref11">11</xref>] analyzed a data set of 67,807 individuals to predict the risk of receiving a misdiagnosis of bipolar disorder among individuals with depression, using only information retrieved from EHRs. Perlis et al [<xref ref-type="bibr" rid="ref12">12</xref>] applied natural language processing to classify the mood states of 127,504 patients, using data from an EHR.</p><p>In order to fully exploit the potential of EHRs for mental health research, however, important issues need to be considered. One preliminary, controversial issue is whether the use of EHR data should be restricted to the purpose for which they were collected [<xref ref-type="bibr" rid="ref13">13</xref>]. Indeed, privacy constraints, data security, and overall ethics regulation must be taken into account when considering whether to use EHRs for research purposes [<xref ref-type="bibr" rid="ref6">6</xref>]. Nonetheless, nowadays, medical data that were originally collected for purposes other than research are being used to study health phenomena in many different fields, including mental health, substance use, noncommunicable diseases (eg, cancer), and health behaviors (eg, cancer screening) [<xref ref-type="bibr" rid="ref14">14</xref>]. 
A further challenge is that data may not be homogeneous or may not be collected systematically, and most data are not derived from structured scales or questionnaires. The adaptation of the EHR represents the first necessary step to planning research projects that include models for predicting health resource utilization, identifying predictors of diagnostic accuracy, and differentiating between remission and chronicity, as done in other fields such as oncology [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>Given this premise, the aim of this paper is to describe (1) the challenges and pitfalls that were encountered in the process of adapting EHR data derived from the public mental health agency in Ferrara, Italy, for research purposes and (2) the development of a data set that is suitable for analysis via AI and traditional techniques. In order to test the feasibility of using these data in analyses and the robustness of analyses based on such data, a clustering analysis was also performed, and preliminary results are presented herein.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethics Approval</title><p>Ethical approval was obtained from the Area Vasta Emilia Centro Ethical Committee on December 12, 2019 (protocol number: 197/2018/Oss/AUSLF). This study conforms to the principles expressed in the Declaration of Helsinki.</p></sec><sec id="s2-2"><title>Setting</title><p>In Italy, mental health care is provided by departments of mental health [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref19">19</xref>]. The levels of care within each department of mental health include community-based mental health centers, hospital psychiatric inpatient units, and rehabilitation or residential facilities. 
Each community-based mental health center serves as a hub of psychiatric care for geographically defined catchment areas with 50,000 to 150,000 inhabitants [<xref ref-type="bibr" rid="ref20">20</xref>]. In Ferrara, Northern Italy, the Integrated Department of Mental Health and Pathological Addictions covers an area of 2630 km<sup>2</sup>, with a catchment of 342,061 inhabitants as of 2020 [<xref ref-type="bibr" rid="ref21">21</xref>].</p></sec><sec id="s2-3"><title>Data Collection and EHRs</title><p>Data were collected in 2 periods that were distinct in terms of the methodology used, the psychiatric services delivered, and the level of digitalization. Data related to the first period, which began in 1925 and ended in 1990, were gathered mostly in a psychiatric asylum, during a time when digital health was not fully developed or adopted.</p><p>In 1991, the first structured EHR (ie, SIPER [Sistema Informativo Psichiatrico dell'Emilia-Romagna]) was introduced and implemented locally by the Local Health Trust of Ferrara for Mental Health in Adults. 
Different software programs were adopted during the years following the implementation of SIPER, and each new software program replaced the previous one by importing already existing data and adding new features (and thus information), as detailed in <xref ref-type="other" rid="box1">Textbox 1</xref>.</p><boxed-text id="box1"><title>Electronic health records implemented by the Local Health Trust of Ferrara for Mental Health in Adults in chronological order.</title><list list-type="order"><list-item><p>SIPER (Sistema Informativo Psichiatrico dell'Emilia-Romagna; 1991-1994) included individual demographic data, medical records, diagnoses, and health services.</p></list-item><list-item><p>CINECA (1994-1998) added the feature labeled as &#x201C;project,&#x201D; which was defined as the comprehensive set of treatments and activities offered to the patient.</p></list-item><list-item><p>GESAP (Gestione attivit&#x00E0; Psichiatrica; 1998-2004) added information about outpatient treatment; hospitalizations in inpatient units, long-term residences, and semiresidences; and outpatient services.</p></list-item><list-item><p>IPPOCRATE (GPI SRL; 2004-2008).</p></list-item><list-item><p>EFESO (Newteam SRL; 2008-2021) added the text field labeled &#x201C;evaluation and treatment area&#x201D; in the medical record, structured diagnostic evaluation, pharmacological treatment prescription and administration, clinical notes, attached documents, and a feature to identify structured clinical protocols (Percorso Diagnostico Terapeutico Assistenziale; diagnostic and therapeutic care pathway).</p></list-item><list-item><p>CURE (Cartella Unificata Regionale Elettronica; Engineering SpA; 2021 to present) added the registration of vital signs and laboratory tests, as well as legal and administrative documentation.</p></list-item></list></boxed-text></sec><sec id="s2-4"><title>Data Preparation</title><p>The first goal was the creation of a new, fully deidentified database with data available in 
EFESO (Newteam SRL)&#x2014;a necessary step for complying with privacy constraints.</p><p>In order to remove all protected health information (PHI), source data needed to be modified. This could not be done by directly editing data in EFESO, since the source could not be altered directly. Thus, the new research database&#x2014;the Ferrara-Psychiatry (FEPSY) database&#x2014;was built via the Extract, Transform, Load process, which is a 3-phase process [<xref ref-type="bibr" rid="ref22">22</xref>] in which data are first extracted from 1 source or multiple and possibly different sources (eg, databases, flat or formatted files, and web pages). Afterward, the extracted data are stored in a staging area, where they undergo transformation, such as filtering, cleaning, summarization, and normalization. Finally, the transformed data are loaded into the destination storage. For example, one type of transformation was record exclusion. We excluded records of patients that could not be unequivocally identified by the tax code&#x2014;a unique 16-character alphanumeric code that identifies a person in Italian public administration forms.</p><p>While assessing the suitability of the FEPSY database for research purposes, we noted that historical information dating back to 1925 had also been maintained in EFESO. We understood that such data were manually imported into the electronic databases that preceded SIPER (year 1991); however, because we could not confirm the procedures, scope, and quality of this historical data import, we decided to document the existence of these data but exclude them from analysis.</p><p>More details about the FEPSY database can be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. 
In Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, for each table in the FEPSY database, the total number of rows (number and percentage of records retained in the FEPSY database) is reported, alongside the number of records in the corresponding original EFESO table from which data were extracted (number of records in the corresponding EFESO table). As detailed in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, of the 4,264,954 records, 3,861,432 (90.54%) were kept. These records included detailed information about the patient, their illness, and the treatments provided.</p><p>In Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, 2 types of anomalies for each table in the FEPSY database are described; one is date inconsistency (eg, when the closing date precedes the opening date of the medical chart), and the other is a date anomaly that was generated by the automated mechanism that was introduced by EFESO when migrating data from IPPOCRATE (GPI SRL; August 26, 2008).</p></sec><sec id="s2-5"><title>Clustering</title><p>Once the anonymized database was built, a clustering analysis was performed to investigate the data set quality. A clustering algorithm is an unsupervised machine learning technique that is used to group objects, so that objects of the same group (or cluster) are very similar to one another and objects of different groups are very dissimilar. To decide the degree of similarity (or dissimilarity) between 2 objects, various distance measures can be used, such as the Euclidean distance between (normalized) numerical representations of the objects. We tested the hypothesis that the patients modeled in the data set could be divided into homogeneous clusters. The k-means algorithm computes a numerical distance between objects to determine to which cluster they belong. However, in our case, data were categorical. 
In 1995, Ralambondrainy [<xref ref-type="bibr" rid="ref23">23</xref>] introduced an approach that enables the use of the k-means algorithm with categorical data. In this approach, nominal attributes are converted into binary attributes&#x2014;one for each value that the attribute can take&#x2014;so that they can be considered as numerical attributes by the algorithm.</p><p>We performed the clustering analysis with the WEKA (Waikato Environment for Knowledge Analysis; University of Waikato) data mining tool, which provides an implementation of the k-means algorithm (ie, SimpleKMeans) and can handle categorical data [<xref ref-type="bibr" rid="ref24">24</xref>]. SimpleKMeans can also handle missing values by replacing them with the mean or mode.</p><p>For this preliminary clustering analysis, we included only the patients who had at least one recorded diagnosis of a mental disorder (ie, <italic>International Classification of Diseases, Ninth Revision</italic> [<italic>ICD-9</italic>] codes 290-319) [<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>Patients were excluded if they had nonpsychiatric diagnoses (<italic>ICD-9</italic> codes V01-V91; 2707/46,222, 5.86%) or had never received an <italic>ICD-9</italic> diagnosis (5493/46,222, 11.88%). 
The resulting subset for the clustering analysis included 38,022 patients.</p><p>We considered sociodemographic variables, such as biological sex, age at first visit, nationality, marital status, living situation, education, occupational status, birthplace (district), and the catchment area (district) providing care (determined by domicile postal code or by residence postal code when the domicile was missing).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Sociodemographic Characteristics</title><p>The sample included 46,222 individuals, whose sociodemographic characteristics are detailed in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Sociodemographic characteristics of all of the individuals who accessed mental health services in the Ferrara province (1991-2021) and were included in the FEPSY<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> database.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top" colspan="2">Characteristic</td><td align="left" valign="top">Female patients (n=28,109)</td><td align="left" valign="top">Male patients (n=18,113)</td><td align="left" valign="top">All patients (N=46,222)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2"><bold>Age at first visit (years), mean (SD)</bold></td><td align="left" valign="top">50.46 (18.82)</td><td align="left" valign="top">48.72 (19.02)</td><td align="left" valign="top">49.78 (18.91)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">&#x003C;18, n (%)</td><td align="left" valign="top">249 (0.89)</td><td align="left" valign="top">164 (0.91)</td><td align="left" valign="top">413 (0.89)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">18-24, n (%)</td><td align="left" valign="top">2173 (7.73)</td><td align="left" valign="top">1842 (10.17)</td><td 
align="left" valign="top">4015 (8.69)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">25-34, n (%)</td><td align="left" valign="top">4221 (15.02)</td><td align="left" valign="top">2913 (16.08)</td><td align="left" valign="top">7134 (15.43)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">35-44, n (%)</td><td align="left" valign="top">5141 (18.29)</td><td align="left" valign="top">3308 (18.26)</td><td align="left" valign="top">8449 (18.28)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">45-54, n (%)</td><td align="left" valign="top">4761 (16.94)</td><td align="left" valign="top">3119 (17.22)</td><td align="left" valign="top">7880 (17.05)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">55-64, n (%)</td><td align="left" valign="top">4142 (14.74)</td><td align="left" valign="top">2423 (13.38)</td><td align="left" valign="top">6565 (14.20)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">65-74, n (%)</td><td align="left" valign="top">3780 (13.45)</td><td align="left" valign="top">2180 (12.04)</td><td align="left" valign="top">5960 (12.89)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">&#x2265;75, n (%)</td><td align="left" valign="top">3634 (12.93)</td><td align="left" valign="top">2160 (11.93)</td><td align="left" valign="top">5794 (12.54)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing data, n (%)</td><td align="left" valign="top">8 (0.03)</td><td align="left" valign="top">4 (0.02)</td><td align="left" valign="top">12 (0.03)</td></tr><tr><td align="left" valign="top" colspan="5"><bold>Nationality, n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Italian</td><td align="left" valign="top">26,486 (94.23)</td><td align="left" valign="top">17,167 (94.78)</td><td align="left" valign="top">43,653 (94.44)</td></tr><tr><td align="left" valign="top"/><td 
align="left" valign="top">Foreign</td><td align="left" valign="top">1580 (5.62)</td><td align="left" valign="top">920 (5.08)</td><td align="left" valign="top">2500 (5.41)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing data</td><td align="left" valign="top">43 (0.15)</td><td align="left" valign="top">26 (0.14)</td><td align="left" valign="top">69 (0.15)</td></tr><tr><td align="left" valign="top" colspan="5"><bold>Birthplace (district), n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Outside Ferrara province</td><td align="left" valign="top">7525 (26.77)</td><td align="left" valign="top">4825 (26.64)</td><td align="left" valign="top">12,350 (26.72)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Ferrara</td><td align="left" valign="top">7299 (25.97)</td><td align="left" valign="top">5034 (27.79)</td><td align="left" valign="top">12,333 (26.68)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Codigoro</td><td align="left" valign="top">3414 (12.15)</td><td align="left" valign="top">2167 (11.96)</td><td align="left" valign="top">5581 (12.07)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Portomaggiore</td><td align="left" valign="top">2803 (9.97)</td><td align="left" valign="top">1795 (9.91)</td><td align="left" valign="top">4598 (9.95)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Copparo</td><td align="left" valign="top">2439 (8.68)</td><td align="left" valign="top">1466 (8.09)</td><td align="left" valign="top">3905 (8.45)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Cento</td><td align="left" valign="top">2262 (8.05)</td><td align="left" valign="top">1463 (8.08)</td><td align="left" valign="top">3725 (8.06)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Outside Italy</td><td align="left" valign="top">2253 (8.02)</td><td align="left" 
valign="top">1258 (6.95)</td><td align="left" valign="top">3511 (7.60)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing data</td><td align="left" valign="top">114 (0.41)</td><td align="left" valign="top">105 (0.58)</td><td align="left" valign="top">219 (0.47)</td></tr><tr><td align="left" valign="top" colspan="5"><bold>Marital status, n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Married or partnered</td><td align="left" valign="top">10,748 (38.24)</td><td align="left" valign="top">6001 (33.13)</td><td align="left" valign="top">16,749 (36.24)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Single</td><td align="left" valign="top">5551 (19.75)</td><td align="left" valign="top">5721 (31.59)</td><td align="left" valign="top">11,272 (24.39)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Separated, divorced, or widowed</td><td align="left" valign="top">5587 (19.88)</td><td align="left" valign="top">1744 (9.63)</td><td align="left" valign="top">7331 (15.86)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing data</td><td align="left" valign="top">6223 (22.14)</td><td align="left" valign="top">4647 (25.66)</td><td align="left" valign="top">10,870 (23.52)</td></tr><tr><td align="left" valign="top" colspan="5"><bold>Living situation, n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Living with acquired family (partner and children)</td><td align="left" valign="top">12,147 (43.21)</td><td align="left" valign="top">6148 (33.94)</td><td align="left" valign="top">18,295 (39.58)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Living with parents</td><td align="left" valign="top">3079 (10.95)</td><td align="left" valign="top">3338 (18.43)</td><td align="left" valign="top">6417 (13.88)</td></tr><tr><td align="left" valign="top"/><td align="left" 
valign="top">Alone</td><td align="left" valign="top">3194 (11.36)</td><td align="left" valign="top">1768 (9.76)</td><td align="left" valign="top">4962 (10.74)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Living with other family members</td><td align="left" valign="top">1649 (5.87)</td><td align="left" valign="top">781 (4.31)</td><td align="left" valign="top">2430 (5.26)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Living with others (eg, roommates)</td><td align="left" valign="top">612 (2.18)</td><td align="left" valign="top">403 (2.22)</td><td align="left" valign="top">1015 (2.20)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Community housing facilities</td><td align="left" valign="top">184 (0.65)</td><td align="left" valign="top">267 (1.47)</td><td align="left" valign="top">451 (0.98)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Other</td><td align="left" valign="top">193 (0.69)</td><td align="left" valign="top">220 (1.21)</td><td align="left" valign="top">413 (0.89)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Safe house</td><td align="left" valign="top">181 (0.64)</td><td align="left" valign="top">199 (1.10)</td><td align="left" valign="top">380 (0.82)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Retirement home</td><td align="left" valign="top">226 (0.80)</td><td align="left" valign="top">146 (0.81)</td><td align="left" valign="top">372 (0.80)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Prison</td><td align="left" valign="top">1 (3.56&#x00D7;10<sup>&#x2212;3</sup>)</td><td align="left" valign="top">16 (0.09)</td><td align="left" valign="top">17 (0.04)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing data</td><td align="left" valign="top">6643 (23.63)</td><td align="left" valign="top">4827 (26.65)</td><td align="left" 
valign="top">11,470 (24.82)</td></tr><tr><td align="left" valign="top" colspan="5"><bold>Education, n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Illiterate</td><td align="left" valign="top">2941 (10.46)</td><td align="left" valign="top">1540 (8.50)</td><td align="left" valign="top">4481 (9.69)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Literate (without formal degree)</td><td align="left" valign="top">3044 (10.83)</td><td align="left" valign="top">2312 (12.76)</td><td align="left" valign="top">5356 (11.59)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Primary school</td><td align="left" valign="top">3674 (13.07)</td><td align="left" valign="top">2167 (11.96)</td><td align="left" valign="top">5841 (12.64)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Middle school</td><td align="left" valign="top">3247 (11.55)</td><td align="left" valign="top">2644 (14.60)</td><td align="left" valign="top">5891 (12.75)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">High school</td><td align="left" valign="top">3946 (14.04)</td><td align="left" valign="top">2378 (13.13)</td><td align="left" valign="top">6324 (13.68)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">College or university</td><td align="left" valign="top">1294 (4.60)</td><td align="left" valign="top">584 (3.22)</td><td align="left" valign="top">1878 (4.06)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Missing data</td><td align="left" valign="top">9963 (35.44)</td><td align="left" valign="top">6488 (35.82)</td><td align="left" valign="top">16,451 (35.59)</td></tr><tr><td align="left" valign="top" colspan="5"><bold>Occupational status, n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Employed</td><td align="left" valign="top">3873 (13.78)</td><td align="left" valign="top">2735 
(15.10)</td><td align="left" valign="top">6608 (14.30)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Retired</td><td align="left" valign="top">2949 (10.49)</td><td align="left" valign="top">1833 (10.12)</td><td align="left" valign="top">4782 (10.35)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Unemployed</td><td align="left" valign="top">1531 (5.45)</td><td align="left" valign="top">1291 (7.13)</td><td align="left" valign="top">2822 (6.11)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Disability</td><td align="left" valign="top">612 (2.18)</td><td align="left" valign="top">670 (3.70)</td><td align="left" valign="top">1282 (2.77)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Other</td><td align="left" valign="top">760 (2.70)</td><td align="left" valign="top">491 (2.71)</td><td align="left" valign="top">1251 (2.71)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Homemaker</td><td align="left" valign="top">944 (3.36)</td><td align="left" valign="top">1 (0.01)</td><td align="left" valign="top">945 (2.04)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Student</td><td align="left" valign="top">512 (1.82)</td><td align="left" valign="top">334 (1.84)</td><td align="left" valign="top">846 (1.83)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Unknown</td><td align="left" valign="top">16,928 (60.22)</td><td align="left" valign="top">10,758 (59.39)</td><td align="left" valign="top">27,686 (59.90)</td></tr><tr><td align="left" valign="top" colspan="5"><bold>Catchment area (district), n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Ferrara</td><td align="left" valign="top">10,964 (39.01)</td><td align="left" valign="top">6784 (37.45)</td><td align="left" valign="top">17,748 (38.40)</td></tr><tr><td align="left" valign="top"/><td align="left" 
valign="top">Codigoro</td><td align="left" valign="top">4186 (14.89)</td><td align="left" valign="top">2931 (16.18)</td><td align="left" valign="top">7117 (15.40)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Portomaggiore</td><td align="left" valign="top">3425 (12.18)</td><td align="left" valign="top">2193 (12.11)</td><td align="left" valign="top">5618 (12.15)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Cento</td><td align="left" valign="top">3380 (12.02)</td><td align="left" valign="top">2097 (11.58)</td><td align="left" valign="top">5477 (11.85)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Copparo</td><td align="left" valign="top">2754 (9.80)</td><td align="left" valign="top">1671 (9.23)</td><td align="left" valign="top">4425 (9.57)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Unknown</td><td align="left" valign="top">3400 (12.10)</td><td align="left" valign="top">2437 (13.45)</td><td align="left" valign="top">5837 (12.63)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>FEPSY: Ferrara-Psychiatry.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Extract, Transform, Load Process</title><sec id="s3-2-1"><title>Built-In Tables</title><p>Built-in tables from the EFESO relational database, which are detailed in <xref ref-type="other" rid="box2">Textbox 2</xref>, were included in the FEPSY database.</p><boxed-text id="box2"><title>Built-in tables included in the FEPSY (Ferrara-Psychiatry) database.</title><list list-type="order"><list-item><p>Table <italic>Patients</italic> included individual personal data, such as name, place and date of birth, biological sex (male or female), home address, living condition, education, marital status, occupation, and other sociodemographic characteristics.</p></list-item><list-item><p>Table <italic>Medical Records</italic> contained 1 or more medical records for each 
patient, with information such as the date of admission, date and type of discharge, primary diagnosis of a mental disorder, and facility providing care.</p></list-item><list-item><p>Table <italic>Diagnoses</italic> included 1 or more diagnoses that were assigned to each individual. Diagnoses were classified according to the <italic>International Classification of Diseases, Ninth Revision</italic> (<italic>ICD-9</italic>) categorical system; therefore, every diagnosis included the associated <italic>ICD-9</italic> code, description, group, and chapter [<xref ref-type="bibr" rid="ref24">24</xref>]. Diagnoses recorded before the introduction of the <italic>ICD-9</italic> were recorded in SIPER (Sistema Informativo Psichiatrico dell'Emilia-Romagna), using standardized conversion criteria [<xref ref-type="bibr" rid="ref24">24</xref>].</p></list-item><list-item><p>Table <italic>Products</italic> referred to the different types of medical services, such as consultations or hospitalizations. A product had a start date and end date, and it may have contained 1 or more medical services.</p></list-item><list-item><p>Table <italic>Medical Services</italic> stored every service that each individual had received or undergone, such as consultations, first visits, the administration of pharmacological treatment, social skill&#x2013;oriented activities, structured diagnostic assessments, and mandatory medical treatments, as well as the facility providing care.</p></list-item><list-item><p>Tables <italic>Medication Prescription</italic> and <italic>Medication Administration</italic> referred to the prescription and administration of pharmacological treatment, type of medication and dosage, start and stop dates, and responsible facility.</p></list-item><list-item><p>Table <italic>Psychometric Tests</italic> included every test administered to each patient and the test types, dates, questions, and scores.</p></list-item><list-item><p>Table <italic>Projects</italic> listed the 
treatment plans for each patient. There were individual and group projects, and within a project, there could have been 1 or more products and medical services.</p></list-item><list-item><p>Table <italic>Facilities</italic> contained all of the facilities of the Health Trust of Ferrara for Mental Health in Adults, such as hospitals, day care centers, and clinics, along with their types and locations.</p></list-item></list></boxed-text></sec><sec id="s3-2-2"><title>Extract</title><p>Data were extracted from EFESO by using an automated procedure that executed an SQL select query. This query selected all relevant fields of a table and other useful information from linked support tables, such as the descriptions of the codes. The result of the query was stored in a Pandas DataFrame (The Pandas Development Team) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>], which can be easily manipulated in the next phase.</p></sec><sec id="s3-2-3"><title>Transform</title><sec id="s3-2-3-1"><title>Record Exclusion</title><p>Data imported before 1991 were excluded (as detailed in the <italic>Data Preparation</italic> section). Some fields and records were removed [<xref ref-type="bibr" rid="ref22">22</xref>] to ensure data consistency, because there were duplicate or erroneous records (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). These were (1) fields containing unreliable information, (2) fields that were present but not in use (their values were always null), and (3) all records marked as &#x201C;deleted&#x201D; (ie, wrong records that were not to be used) and all records in other tables referencing the &#x201C;deleted&#x201D; ones. We decided to remove 36 individuals that had unique fiscal codes but duplicate patient IDs&#x2014;corresponding to 0.15% (72/48,001) of the records in the total data set&#x2014;since it was not possible to determine which of the two entries was the correct one. 
When a patient was first included in the database, a unique identifier&#x2014;the patient ID&#x2014;was assigned. The combination of the tax code and the patient ID allowed for the unique identification of a patient in the database. We also excluded patients for whom a record was opened earlier than the birth date (16/48,001, 0.03%), patients with no medical records (603/48,001, 1.26%), and patients marked as &#x201C;deleted&#x201D; (77/48,001, 0.16%). Overall, 1.6% (768/48,001) of the total records, which related to 732 patients, were removed from the source table.</p></sec><sec id="s3-2-3-2"><title>Anonymization</title><p>Anonymization was necessary in order to use the extracted data for research projects and was performed on tables <italic>Patients</italic> and <italic>Medical Records</italic>. First, the extracted records were shuffled. Afterward, the original patient and medical record IDs were replaced with a universally unique identifier (UUID), which is a 128-bit string that is usually represented as a sequence of 32 hexadecimal digits [<xref ref-type="bibr" rid="ref28">28</xref>]. These new random, unique identifiers were generated with the <italic>uuid4</italic> function of the Python <italic>uuid</italic> package (Python Software Foundation) [<xref ref-type="bibr" rid="ref29">29</xref>] and used as the new primary key. In order to maintain the referential integrity (ie, the primary key of one table is a foreign key in another table, meaning that they are related), the old IDs were replaced with the new ones within every table in which they appeared. Furthermore, all PHI were excluded from table <italic>Patients</italic>; these data included first names, last names, days and months of birth, tax codes, home addresses, phone numbers, and note fields that could potentially include personal data (eg, relatives&#x2019; names). 
For the same reason, text note fields were also excluded from other tables, when present.</p></sec><sec id="s3-2-3-3"><title>Field Transformation</title><p>Transformation was necessary for date fields. EFESO stored dates in &#x201C;datetime&#x201D; format, that is, &#x201C;dd/mm/yyyy hh:mm.&#x201D; However, previous EHRs stored only the date, without the hour information. Furthermore, even when specified, the hour information is not always reliable. For this reason, the date fields were split into 2 fields&#x2014;one for the date and one for the time.</p></sec><sec id="s3-2-3-4"><title>Missing Values</title><p>Missing values were assessed to avoid the introduction of bias. In specific analyses, the level and pattern of missingness will be assessed for each variable included and dealt with accordingly.</p></sec></sec></sec><sec id="s3-3"><title>Load</title><p>Data extracted from EFESO were loaded in the FEPSY database&#x2014;the newly created MySQL (Oracle Corporation) relational database&#x2014;by using the same automated procedure that was used to extract them. For each built-in table, an insert query, which took the values from the same DataFrame of the select query, was executed.</p></sec><sec id="s3-4"><title>Analysis of the Extracted Data</title><p>The data included in the final composite FEPSY data set were those collected from 1991 to February 2021. Since 1991, each year, a median of 1404 (IQR 1117.5-1757.7) individuals had newly accessed care, and a median of 7300 (IQR 6109.5-9397.5) individuals were actively receiving care, as represented in <xref ref-type="fig" rid="figure1">Figure 1</xref>. <xref ref-type="fig" rid="figure2">Figure 2</xref> shows the number of patients treated per year in total and by sex. The sudden decrease observed in 2009 was due to an automated closing procedure that was introduced in 2008 and retained from then on. 
When migrating from IPPOCRATE to EFESO, all medical records, products, and diagnoses that had not been updated in 365 days were assumed to be closed or terminated, and the missing closing date was replaced with the date of the migration to EFESO, that is, August 26, 2008.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>New admissions per year in total and by sex (upper panel). Timeline of the electronic health records adopted by the health care agency in the Ferrara province (lower panel). CURE: Cartella Unificata Regionale Elettronica; GESAP: Gestione attivit&#x00E0; Psichiatrica; SIPER: Sistema Informativo Psichiatrico dell'Emilia-Romagna.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v11i1e45523_fig01.png"/></fig><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Patients receiving care from the mental health services in Ferrara over time (years 1991-2021), in total (continuous line) and by sex (dotted and dashed lines). CURE: Cartella Unificata Regionale Elettronica; GESAP: Gestione attivit&#x00E0; Psichiatrica; SIPER: Sistema Informativo Psichiatrico dell'Emilia-Romagna.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v11i1e45523_fig02.png"/></fig><p>As described in <xref ref-type="table" rid="table2">Table 2</xref>, the most frequent diagnoses at first admission were depression and anxiety disorder. 
During the 30-year time span, more than half (32,230/46,222, 69.73%) of the patients had only 1 chart open, and only 5184 patients had at least one psychiatric hospitalization.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Main clinical characteristics of the sample (N=46,222; years 1991-2021).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Characteristics</td><td align="left" valign="bottom">Female patients (n=28,109, 60.81%)</td><td align="left" valign="bottom">Male patients (n=18,113, 39.19%)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4"><bold>Age at first visit</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Years, mean (SD)</td><td align="left" valign="top">50.46 (18.82)</td><td align="left" valign="top">48.72 (19.02)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Years, median (range)</td><td align="left" valign="top">49.0 (0-109)</td><td align="left" valign="top">47.0 (2-98)</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Number of charts/patient</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Value, mean (SD)</td><td align="left" valign="top">1.62 (1.55)</td><td align="left" valign="top">1.64 (2.38)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Value, median (range)</td><td align="left" valign="top">1.0 (1-63)</td><td align="left" valign="top">1.0 (1-132)</td></tr><tr><td align="left" valign="top" colspan="2">Patients with at least one hospitalization, n</td><td align="left" valign="top">2680</td><td align="left" valign="top">2504</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Number of hospitalizations/patient</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Value, mean (SD)</td><td align="left" valign="top">0.33 (2.36)</td><td align="left" valign="top">0.46 
(2.35)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Value, median (range)</td><td align="left" valign="top">0 (0-143)</td><td align="left" valign="top">0 (0-102)</td></tr><tr><td align="left" valign="top" colspan="2">Patients with at least one compulsory admission, n (%)</td><td align="left" valign="top">415 (1.48)</td><td align="left" valign="top">485 (2.68)</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Duration of hospitalization</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Days, mean (SD)</td><td align="left" valign="top">5.08 (40.89)</td><td align="left" valign="top">7.53 (62.39)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Days, median (range)</td><td align="left" valign="top">0 (0-2661)</td><td align="left" valign="top">0 (0-4090)</td></tr><tr><td align="left" valign="top" colspan="4"><bold>First recorded mental disorder diagnosis<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>, n (%)</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Anxiety disorders</td><td align="left" valign="top">6884 (24.49)</td><td align="left" valign="top">3725 (20.57)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Dementia and other organic disorders</td><td align="left" valign="top">2092 (7.44)</td><td align="left" valign="top">1601 (8.84)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Depression</td><td align="left" valign="top">7648 (27.21)</td><td align="left" valign="top">3335 (18.41)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Drug and substance use or abuse</td><td align="left" valign="top">415 (1.48)</td><td align="left" valign="top">861 (4.75)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Eating disorders</td><td align="left" valign="top">241 (0.86)</td><td align="left" valign="top">18 (0.10)</td></tr><tr><td 
align="left" valign="top"/><td align="left" valign="top">Intellectual disability</td><td align="left" valign="top">468 (1.66)</td><td align="left" valign="top">636 (3.51)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Mania and bipolar disorders</td><td align="left" valign="top">713 (2.54)</td><td align="left" valign="top">460 (2.54)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Personality disorders</td><td align="left" valign="top">1287 (4.58)</td><td align="left" valign="top">1186 (6.55)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Schizophrenia and other nonorganic psychoses</td><td align="left" valign="top">1468 (5.22)</td><td align="left" valign="top">1515 (8.36)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Other mental disorders</td><td align="left" valign="top">2339 (8.32)</td><td align="left" valign="top">1130 (6.24)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">No formal mental disorder diagnosis</td><td align="left" valign="top">4554 (16.20)</td><td align="left" valign="top">3646 (20.13)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Mental disorder diagnoses: <italic>International Classification of Diseases, Ninth Revision</italic> codes 290.xx-319.xx.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-5"><title>Clustering Results</title><p>This analysis, which was carried out on the subset of 38,022 individuals who had at least one mental disorder diagnosis, identified 2 distinct clusters (<xref ref-type="fig" rid="figure3">Figure 3</xref>). 
One is represented by single male patients who were born in Ferrara, those who were living with parents, and those whose age at first visit was between 25 and 34 years; the other is represented by married female patients who were living with their own acquired families, those who were born outside the province of Ferrara, and those whose age at first visit was 35 to 44 years. The following sociodemographic features were similar in the two clusters: Italian nationality, individuals with a high school degree, employed individuals, and individuals who were receiving treatment in the Ferrara catchment area.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Results from the clustering analysis.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v11i1e45523_fig03.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study describes the process of adapting one of the longest running EHRs of public mental health care for research purposes. The FEPSY data set covers a catchment area with 342,061 inhabitants (as of 2020) and includes a total of 46,222 unique individuals who had access to mental health services over a span of 30 years (1991-2021). The FEPSY database is suitable for descriptive, predictive, and inferential analyses via conventional analysis and AI techniques, as demonstrated by the preliminary findings of the clustering analysis. To our knowledge, our database is the first of its kind in Italy. In Europe, longitudinal and prospective registries have long been in use. For example, large data sets were extracted from the Danish National Patient Registry [<xref ref-type="bibr" rid="ref30">30</xref>] and the Danish Psychiatric Central Research Register [<xref ref-type="bibr" rid="ref31">31</xref>]. The first data set contained data on 8,085,603 patients, which were collected from 1977 to 2012. 
The second data set included data on a total of 747,176 patients, which were collected from 1970 to 2010. In both cases, the register contained dates of the onset and end of any treatment, diagnoses, types of referrals, and places of treatment, thereby allowing for the possibility to perform health registry&#x2013;based research [<xref ref-type="bibr" rid="ref32">32</xref>], considering a total population of approximately 27 million.</p><p>The main finding of this study is that data that were not originally conceived for research were successfully extracted from EHR software and loaded into a new anonymized database. This step is of foremost importance, as the data originated from an information system that was changed and updated multiple times and was not designed to allow for exploratory investigations in a structured manner. Thus, this new data set may represent the ideal setting to build, test, and refine an analytical methodology for extracting data and preparing these data for research purposes. This methodology could also be applied to other clinical data sets, such as data sets from other medical disciplines (eg, oncology), with characteristics that are similar to those of the FEPSY data set [<xref ref-type="bibr" rid="ref33">33</xref>]. 
Additionally, it will be of foremost importance to validate the methodological approach and findings of upcoming research originating from the FEPSY data set by proactively seeking collaboration with other research groups, in order to enable the replication of findings from the territory of Ferrara and the use of the FEPSY data set to replicate findings from research involving other registries.</p><p>This work also allows for collaborations in terms of learning health networks, which use comparable data that originate from EHRs to support clinical decisions, improve the delivery of efficient and effective medical care, and help with the integration of research in health care [<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>].</p><p>Our results will also pave the way for an in-depth study on the use of health care resources; the results will be used to develop a system that is capable of planning the use of such resources. Such a system would optimize the use of health care resources while maintaining or possibly improving the quality of treatment. For example, in Italy, Donisi et al [<xref ref-type="bibr" rid="ref37">37</xref>] predicted the cost of community mental health care by using clinical and sociodemographic information originating from the Psychiatric Case Register in the Verona Health District. This allowed for the linking of social deprivation to psychiatric service utilization [<xref ref-type="bibr" rid="ref38">38</xref>] and shed light on possible contributors to social isolation in an already vulnerable population. Our clustering analysis, which was conducted on the FEPSY data set to test its feasibility and robustness, identified 2 clusters; women appeared to access mental health services later in life and were typically married, in comparison to men. 
These findings were consistent with the literature [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>] and supported the ability of the extracted data to detect known patterns, even though the results should be interpreted with caution, given the large amount of missing sociodemographic data. Clustering analyses can be useful for building prediction models and planning a department's resource allocation, as they provide relevant information on patients at presentation and on illness trajectory [<xref ref-type="bibr" rid="ref42">42</xref>].</p><p>The process described in this paper faced 5 major challenges that we mitigated, as follows. First, the source data included several built-in structural informatic elements (so-called <italic>tables</italic>) that had to be screened and deleted in order to get to the core data. Second, the anonymization step was of absolute importance, and in order to both comply with privacy constraints and be able to preserve the integrity of the data, the study team decided to keep only subelements of certain data items (eg, for the birth date, only the year was kept, and for residence, only the postal code was kept). Third, in order to establish which records were correct, an iterative comparison of the FEPSY database and the local and regional database was performed by a third party who had access to PHI. Fourth, records that were deemed unreliable were excluded (eg, clinical procedures referring to nonexistent medical records). Furthermore, the data extracted from EFESO originated from different software and thus possibly generated some errors. In the FEPSY data set, these errors seem to be limited to records, and the proportion of records with errors was very low (49,854/3,861,432, 1.29%). In the end, we decided to exclude data that were collected before 1991 and duplicate patient records. Fifth, missing data challenges were also addressed, especially in the clustering process. 
For this purpose, the WEKA data mining tool was used.</p></sec><sec id="s4-2"><title>Strengths of This Study</title><p>The quality and completeness of the collected and cleaned data, as well as the large number of records stored in the FEPSY database, resulted in the definition of a data set that is particularly suitable for automatic analysis and has appealing characteristics for research, such as a long period of data availability, great diversity in the sociodemographic factors of the patients represented, and a history of treatments and drugs administered. This could possibly represent a strong foundation for many different studies of mental illness and resource use, favoring comparisons between Italy and other countries regarding the delivery and quality of community and hospital psychiatric care [<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref45">45</xref>]. Furthermore, the newly created database does not include sensitive information, even though this information can be retrieved by using an external supporting table created ad hoc, which could link the FEPSY data set with other data sets (eg, hospital data and tumor registries) for future research.</p><p>The novelty of this project is represented by its interdisciplinary nature (psychiatry, public health, epidemiology, sociology, mathematics, computer science, and AI), the potential versatility of the methods that can be used with the FEPSY database, and the versatility of the systems that could be created via analyses involving the FEPSY database. 
To our knowledge, this study is the first attempt to retrospectively build a single data set that includes more than 30 years&#x2019; worth of data on mental health services in a specific area.</p><p>Such a data set would also allow for longitudinal analyses, such as those that have already been performed with the Nordic registry (a prospective registry) and, more recently, the South London and Maudsley National Health Service [<xref ref-type="bibr" rid="ref46">46</xref>] and the Camden &#x0026; Islington Research Database [<xref ref-type="bibr" rid="ref47">47</xref>].</p><p>We believe that historical data can add value to subsequent analyses, because they allow researchers to understand how mental health services have evolved over the past decades and the extent to which phenotypical presentations of different diseases have changed over time. In light of these considerations, factors that should be taken into account are (1) potential cohort and time effects, such as historical events (eg, the Great Recession in 2008); (2) changes in legal and medical approaches to mental health; and (3) changes in the classification of mental disorders [<xref ref-type="bibr" rid="ref48">48</xref>].</p></sec><sec id="s4-3"><title>Limitations</title><p>Our findings must be interpreted in the light of some limitations. First, the sample size is limited by the geographical catchment. A larger catchment or a more densely populated region would probably have a larger volume of treated individuals and thus have more data, which would facilitate machine learning analyses. However, we believe that even if the sample is limited by the geographical catchment, the diverse socioeconomic distribution in Ferrara is a strength that mitigates this limitation, providing insight into the possible moderator or mediator roles of socioeconomic variables that are considered social determinants of mental health. 
Second, another potential limitation is the missing data for some sociodemographic attributes, which may reduce the statistical power of a study [<xref ref-type="bibr" rid="ref49">49</xref>] or affect the accuracy of machine learning algorithms [<xref ref-type="bibr" rid="ref50">50</xref>]. In order to overcome this issue, missing values can be handled with multiple imputation methods or replaced with the mean or the mode (ie, for quantitative or qualitative data, respectively). Moreover, sociodemographic information can be drawn from external and publicly available sources, such as the Italian National Institute of Statistics [<xref ref-type="bibr" rid="ref51">51</xref>], which includes the census of the population as well as social, economic, and environmental surveys and analyses. Lastly, there is the risk of introducing bias while building prediction models, especially when using supervised machine learning techniques, due to small sample sizes and the poor handling of missing data and overfitting [<xref ref-type="bibr" rid="ref52">52</xref>]. With regard to the sample size, our sample appears to be sufficiently large for risk prediction analyses. 
Overfitting can be addressed with penalized models [<xref ref-type="bibr" rid="ref53">53</xref>].</p></sec><sec id="s4-4"><title>Future Directions</title><p>This work sets a starting point for future investigations, which can be described as follows: (1) identifying patients who have a higher severity index or chronicity level and those who require a greater use of health resources; (2) identifying and validating, by means of machine learning models, demographic, clinical, and social predictors of clinically relevant outcomes that are useful for an ad hoc programming of resources (eg, sex, gender, or social deprivation [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref54">54</xref>]); (3) further optimizing and tailoring the analysis methods, so that they can also be applied to other data sets (eg, the local mental health registries for child and adolescent neuropsychiatry and for drug addiction services); (4) interacting with international learning health networks [<xref ref-type="bibr" rid="ref55">55</xref>-<xref ref-type="bibr" rid="ref57">57</xref>]; and (5) linking the FEPSY data set with external data sources, such as census data, tumor registries [<xref ref-type="bibr" rid="ref58">58</xref>], death registries, and criminal justice data [<xref ref-type="bibr" rid="ref59">59</xref>]. As a result of the increasing digitalization of medical records, it was possible to gather years of mental health history for every patient. This will enable the conduct of symbolic and subsymbolic analyses on time series via automatic methodologies. Classical supervised and unsupervised machine learning and deep learning techniques will be evaluated. 
In order to explore the relationship between sociodemographic characteristics and specific diagnostic questions (eg, the incidence and prevalence of psychosis), a supervised framework will be deployed, in which binary labels (eg, &#x201C;psychosis&#x201D; or &#x201C;no-psychosis&#x201D;) or multiple classification labels (eg, &#x201C;ICD-9 diagnosis&#x201D;) will be associated with the patient. The main problem to overcome will be the imbalance of the data set, that is, when there is an unequal distribution of classes in the data set. In such instances, a standard machine learning technique, such as a support vector machine or random forest [<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref61">61</xref>], will be applied. Moreover, each patient could potentially be considered as a distinct time series by including the temporal dimension of the treatment and by applying recurrent neural networks [<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref63">63</xref>]. By doing so, the prediction of the new onset of a disease and the subsequent use of health resources will be the focus, in order to plan and optimize health care resources.</p></sec><sec id="s4-5"><title>Conclusions</title><p>The process described in this study resulted in the building of a data set that included the information of 46,222 individuals who had access to psychiatric services in the Ferrara province over the course of almost 30 years. The preliminary findings from the clustering analysis confirmed the quality of the newly established database. 
The process we implemented proved to be a solid method that can be replicated with similar data sets, even if they were not originally compiled for research purposes.</p></sec></sec></body><back><ack><p>This work was supported by the &#x201C;Fondo per l&#x2019;Incentivazione alla Ricerca (FIR),&#x201D; granted by the University of Ferrara in 2021 to MF, with the project titled &#x201C;Intelligenza Artificiale per Predizione Diagnostica, di Carico Assistenziale, e di Esito: 40 Anni di accessi Presso i Centri di Salute Mentale della Provincia di Ferrara (AI4MentalHealth).&#x201D;</p></ack><fn-group><fn fn-type="con"><p>MF designed the study, wrote the first draft of the manuscript, and supervised the project. EG processed the experimental data, performed the analysis, and designed the figures. MBM, RZ, MA, GF, ID, FF, and LG were involved in planning and interpreting the results. CS, LB, and JL aided in interpreting the results. All authors discussed the results, commented on the manuscript, and approved the final version.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb3">FEPSY</term><def><p>Ferrara-Psychiatry</p></def></def-item><def-item><term id="abb4"><italic>ICD-9</italic></term><def><p><italic>International Classification of Diseases, Ninth Revision</italic></p></def></def-item><def-item><term id="abb5">PHI</term><def><p>protected health information</p></def></def-item><def-item><term id="abb6">SIPER</term><def><p>Sistema Informativo Psichiatrico dell'Emilia-Romagna</p></def></def-item><def-item><term id="abb7">UUID</term><def><p>universally unique identifier</p></def></def-item><def-item><term id="abb8">WEKA</term><def><p>Waikato Environment for Knowledge 
Analysis</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Braveman</surname><given-names>P</given-names></name><name name-style="western"><surname>Gottlieb</surname><given-names>L</given-names></name></person-group><article-title>The social determinants of health: it's time to consider the causes of the causes</article-title><source>Public Health Rep</source><year>2014</year><volume>129 Suppl 2</volume><issue>Suppl 2</issue><fpage>19</fpage><lpage>31</lpage><pub-id pub-id-type="doi">10.1177/00333549141291S206</pub-id><pub-id pub-id-type="medline">24385661</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>World Health Organization</collab></person-group><article-title>Social determinants of health</article-title><access-date>2023-07-4</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/health-topics/social-determinants-of-health#tab=tab_1">www.who.int/health-topics/social-determinants-of-health#tab=tab_1</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marmot</surname><given-names>M</given-names></name><name name-style="western"><surname>Bell</surname><given-names>R</given-names></name></person-group><article-title>Social determinants and non-communicable diseases: time for integrated action</article-title><source>BMJ</source><year>2019</year><month>01</month><day>28</day><volume>364</volume><fpage>l251</fpage><pub-id pub-id-type="doi">10.1136/bmj.l251</pub-id><pub-id pub-id-type="medline">30692093</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Thieme</surname><given-names>A</given-names></name><name name-style="western"><surname>Belgrave</surname><given-names>D</given-names></name><name name-style="western"><surname>Doherty</surname><given-names>G</given-names></name></person-group><article-title>Machine learning in mental health: a systematic review of the HCI literature to support the development of effective and implementable ML systems</article-title><source>ACM Trans Comput Hum Interact</source><year>2020</year><month>08</month><day>17</day><volume>27</volume><issue>5</issue><fpage>1</fpage><lpage>53</lpage><pub-id pub-id-type="doi">10.1145/3398069</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mehta</surname><given-names>N</given-names></name><name name-style="western"><surname>Pandit</surname><given-names>A</given-names></name><name name-style="western"><surname>Shukla</surname><given-names>S</given-names></name></person-group><article-title>Transforming healthcare with big data analytics and artificial intelligence: A systematic mapping study</article-title><source>J Biomed Inform</source><year>2019</year><month>12</month><volume>100</volume><fpage>103311</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2019.103311</pub-id><pub-id pub-id-type="medline">31629922</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ngiam</surname><given-names>KY</given-names></name><name name-style="western"><surname>Khor</surname><given-names>IW</given-names></name></person-group><article-title>Big data and machine learning algorithms for health-care delivery</article-title><source>Lancet 
Oncol</source><year>2019</year><month>05</month><volume>20</volume><issue>5</issue><fpage>e262</fpage><lpage>e273</lpage><pub-id pub-id-type="doi">10.1016/S1470-2045(19)30149-4</pub-id><pub-id pub-id-type="medline">31044724</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="book"><person-group person-group-type="editor"><name name-style="western"><surname>Mechelli</surname><given-names>A</given-names></name><name name-style="western"><surname>Vieira</surname><given-names>S</given-names></name></person-group><source>Machine Learning: Methods and Applications to Brain Disorders, 1st Edition</source><year>2019</year><publisher-loc>San Diego, CA</publisher-loc><publisher-name>Elsevier</publisher-name><comment>ISBN</comment><pub-id pub-id-type="other">9780128157398</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Graham</surname><given-names>S</given-names></name><name name-style="western"><surname>Depp</surname><given-names>C</given-names></name><name name-style="western"><surname>Lee</surname><given-names>EE</given-names></name><name name-style="western"><surname>Nebeker</surname><given-names>C</given-names></name><name name-style="western"><surname>Tu</surname><given-names>X</given-names></name><name name-style="western"><surname>Kim</surname><given-names>HC</given-names></name><etal/></person-group><article-title>Artificial intelligence for mental health and mental illnesses: an overview</article-title><source>Curr Psychiatry Rep</source><year>2019</year><month>11</month><day>7</day><volume>21</volume><issue>11</issue><fpage>116</fpage><pub-id pub-id-type="doi">10.1007/s11920-019-1094-0</pub-id><pub-id pub-id-type="medline">31701320</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Hughes</surname><given-names>MC</given-names></name><name name-style="western"><surname>Pradier</surname><given-names>MF</given-names></name><name name-style="western"><surname>Ross</surname><given-names>AS</given-names></name><name name-style="western"><surname>McCoy</surname><given-names>TH Jr</given-names></name><name name-style="western"><surname>Perlis</surname><given-names>RH</given-names></name><name name-style="western"><surname>Doshi-Velez</surname><given-names>F</given-names></name></person-group><article-title>Assessment of a prediction model for antidepressant treatment stability using supervised topic models</article-title><source>JAMA Netw Open</source><year>2020</year><month>05</month><day>1</day><volume>3</volume><issue>5</issue><fpage>e205308</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.5308</pub-id><pub-id pub-id-type="medline">32432711</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>Z</given-names></name><name name-style="western"><surname>Wang</surname><given-names>F</given-names></name><name name-style="western"><surname>Adekkanattu</surname><given-names>P</given-names></name><name name-style="western"><surname>Bose</surname><given-names>B</given-names></name><name name-style="western"><surname>Vekaria</surname><given-names>V</given-names></name><name name-style="western"><surname>Brandt</surname><given-names>P</given-names></name><etal/></person-group><article-title>Subphenotyping depression using machine learning and electronic health records</article-title><source>Learn Health Syst</source><year>2020</year><month>08</month><day>3</day><volume>4</volume><issue>4</issue><fpage>e10241</fpage><pub-id pub-id-type="doi">10.1002/lrh2.10241</pub-id><pub-id pub-id-type="medline">33083540</pub-id></nlm-citation></ref><ref 
id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pradier</surname><given-names>MF</given-names></name><name name-style="western"><surname>Hughes</surname><given-names>MC</given-names></name><name name-style="western"><surname>McCoy</surname><given-names>TH Jr</given-names></name><name name-style="western"><surname>Barroilhet</surname><given-names>SA</given-names></name><name name-style="western"><surname>Doshi-Velez</surname><given-names>F</given-names></name><name name-style="western"><surname>Perlis</surname><given-names>RH</given-names></name></person-group><article-title>Predicting change in diagnosis from major depression to bipolar disorder after antidepressant initiation</article-title><source>Neuropsychopharmacology</source><year>2021</year><month>01</month><volume>46</volume><issue>2</issue><fpage>455</fpage><lpage>461</lpage><pub-id pub-id-type="doi">10.1038/s41386-020-00838-x</pub-id><pub-id pub-id-type="medline">32927464</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Perlis</surname><given-names>RH</given-names></name><name name-style="western"><surname>Iosifescu</surname><given-names>DV</given-names></name><name name-style="western"><surname>Castro</surname><given-names>VM</given-names></name><name name-style="western"><surname>Murphy</surname><given-names>SN</given-names></name><name name-style="western"><surname>Gainer</surname><given-names>VS</given-names></name><name name-style="western"><surname>Minnier</surname><given-names>J</given-names></name><etal/></person-group><article-title>Using electronic medical records to enable large-scale studies in psychiatry: treatment resistant depression as a model</article-title><source>Psychol 
Med</source><year>2012</year><month>01</month><volume>42</volume><issue>1</issue><fpage>41</fpage><lpage>50</lpage><pub-id pub-id-type="doi">10.1017/S0033291711000997</pub-id><pub-id pub-id-type="medline">21682950</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van der Lei</surname><given-names>J</given-names></name></person-group><article-title>Use and abuse of computer-stored medical records</article-title><source>Methods Inf Med</source><year>1991</year><month>04</month><volume>30</volume><issue>2</issue><fpage>79</fpage><lpage>80</lpage><pub-id pub-id-type="medline">1857252</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>HA</given-names></name><name name-style="western"><surname>Jung</surname><given-names>H</given-names></name><name name-style="western"><surname>On</surname><given-names>J</given-names></name><name name-style="western"><surname>Park</surname><given-names>SK</given-names></name><name name-style="western"><surname>Kang</surname><given-names>H</given-names></name></person-group><article-title>Digital epidemiology: use of digital data collected for non-epidemiological purposes in epidemiological studies</article-title><source>Healthc Inform Res</source><year>2018</year><month>10</month><volume>24</volume><issue>4</issue><fpage>253</fpage><lpage>262</lpage><pub-id pub-id-type="doi">10.4258/hir.2018.24.4.253</pub-id><pub-id pub-id-type="medline">30443413</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>Gazzetta Ufficiale</collab></person-group><article-title>Legge 22 Marzo 2019, n 29: Istituzione e disciplina della Rete nazionale dei registri dei tumori e dei sistemi di 
sorveglianza e del referto epidemiologico per il controllo sanitario della popolazione</article-title><year>2019</year><access-date>2023-07-4</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.gazzettaufficiale.it/eli/id/2019/04/05/19G00036/sg">www.gazzettaufficiale.it/eli/id/2019/04/05/19G00036/sg</ext-link></comment></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ferrannini</surname><given-names>L</given-names></name><name name-style="western"><surname>Ghio</surname><given-names>L</given-names></name><name name-style="western"><surname>Gibertoni</surname><given-names>D</given-names></name><name name-style="western"><surname>Lora</surname><given-names>A</given-names></name><name name-style="western"><surname>Tibaldi</surname><given-names>G</given-names></name><name name-style="western"><surname>Neri</surname><given-names>G</given-names></name><etal/></person-group><article-title>Thirty-five years of community psychiatry in Italy</article-title><source>J Nerv Ment Dis</source><year>2014</year><month>06</month><volume>202</volume><issue>6</issue><fpage>432</fpage><lpage>439</lpage><pub-id pub-id-type="doi">10.1097/NMD.0000000000000141</pub-id><pub-id pub-id-type="medline">24821278</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Barbui</surname><given-names>C</given-names></name><name name-style="western"><surname>Papola</surname><given-names>D</given-names></name><name name-style="western"><surname>Saraceno</surname><given-names>B</given-names></name></person-group><article-title>Forty years without mental hospitals in Italy</article-title><source>Int J Ment Health Syst</source><year>2018</year><month>07</month><day>31</day><volume>12</volume><fpage>43</fpage><pub-id 
pub-id-type="doi">10.1186/s13033-018-0223-1</pub-id><pub-id pub-id-type="medline">30079100</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mezzina</surname><given-names>R</given-names></name></person-group><article-title>Forty years of the law 180: the aspirations of a great reform, its successes and continuing need</article-title><source>Epidemiol Psychiatr Sci</source><year>2018</year><month>08</month><volume>27</volume><issue>4</issue><fpage>336</fpage><lpage>345</lpage><pub-id pub-id-type="doi">10.1017/S2045796018000070</pub-id><pub-id pub-id-type="medline">29506591</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>Gazzetta Ufficiale</collab></person-group><article-title>Decreto del Presidente Della Repubblica 1 Novembre 1999: Approvazione del Progetto Obiettivo &#x201C;Tutela salute Mentale 1998-2000&#x201D;</article-title><year>1999</year><access-date>2023-07-4</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.gazzettaufficiale.it/atto/serie_generale/caricaDettaglioAtto/originario?atto.dataPubblicazioneGazzetta=1999-11-22&#x0026;atto.codiceRedazionale=099A9917&#x0026;elenco30giorni=false">www.gazzettaufficiale.it/atto/serie_generale/caricaDettaglioAtto/originario?atto.dataPubblicazioneGazzetta=1999-11-22&#x0026;atto.codiceRedazionale=099A9917&#x0026;elenco30giorni=false</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ferrara</surname><given-names>M</given-names></name><name name-style="western"><surname>Tedeschini</surname><given-names>E</given-names></name><name name-style="western"><surname>Baccari</surname><given-names>F</given-names></name><name 
name-style="western"><surname>Musella</surname><given-names>V</given-names></name><name name-style="western"><surname>Vacca</surname><given-names>F</given-names></name><name name-style="western"><surname>Mazzi</surname><given-names>F</given-names></name><etal/></person-group><article-title>Early intervention service for first episode psychosis in Modena, Northern Italy: the first hundred cases</article-title><source>Early Interv Psychiatry</source><year>2019</year><month>08</month><volume>13</volume><issue>4</issue><fpage>1011</fpage><lpage>1017</lpage><pub-id pub-id-type="doi">10.1111/eip.12788</pub-id><pub-id pub-id-type="medline">30672134</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Murri</surname><given-names>MB</given-names></name><name name-style="western"><surname>Bertelli</surname><given-names>R</given-names></name><name name-style="western"><surname>Carozza</surname><given-names>P</given-names></name><name name-style="western"><surname>Berardi</surname><given-names>L</given-names></name><name name-style="western"><surname>Cantarelli</surname><given-names>L</given-names></name><name name-style="western"><surname>Croce</surname><given-names>E</given-names></name><etal/></person-group><article-title>First-episode psychosis in the Ferrara Mental Health Department: incidence and clinical course within the first 2&#x2009;years</article-title><source>Early Interv Psychiatry</source><year>2021</year><month>12</month><volume>15</volume><issue>6</issue><fpage>1738</fpage><lpage>1748</lpage><pub-id pub-id-type="doi">10.1111/eip.13095</pub-id><pub-id pub-id-type="medline">33264815</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Denney</surname><given-names>MJ</given-names></name><name 
name-style="western"><surname>Long</surname><given-names>DM</given-names></name><name name-style="western"><surname>Armistead</surname><given-names>MG</given-names></name><name name-style="western"><surname>Anderson</surname><given-names>JL</given-names></name><name name-style="western"><surname>Conway</surname><given-names>BN</given-names></name></person-group><article-title>Validating the extract, transform, load process used to populate a large clinical research database</article-title><source>Int J Med Inform</source><year>2016</year><month>10</month><volume>94</volume><fpage>271</fpage><lpage>274</lpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2016.07.009</pub-id><pub-id pub-id-type="medline">27506144</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ralambondrainy</surname><given-names>H</given-names></name></person-group><article-title>A conceptual version of the K-means algorithm</article-title><source>Pattern Recognit Lett</source><year>1995</year><month>11</month><volume>16</volume><issue>11</issue><fpage>1147</fpage><lpage>1157</lpage><pub-id pub-id-type="doi">10.1016/0167-8655(95)00075-R</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Witten</surname><given-names>IH</given-names></name><name name-style="western"><surname>Frank</surname><given-names>E</given-names></name><name name-style="western"><surname>Hall</surname><given-names>MA</given-names></name><name name-style="western"><surname>Pal</surname><given-names>CJ</given-names></name></person-group><source>Data Mining: Practical Machine Learning Tools and Techniques, Fourth Edition</source><year>2016</year><publisher-loc>Burlington, MA</publisher-loc><publisher-name>Morgan Kaufmann Publishers Inc</publisher-name></nlm-citation></ref><ref 
id="ref25"><label>25</label><nlm-citation citation-type="book"><person-group person-group-type="author"><collab>World Health Organization</collab></person-group><source>International Classification of Diseases Ninth Revision: Basic Tabulation List With Alphabetic Index</source><year>1978</year><publisher-loc>Geneva, Switzerland</publisher-loc><publisher-name>World Health Organization</publisher-name></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>The Pandas development team</collab></person-group><article-title>pandas-dev/Pandas: Pandas 1.3.4</article-title><year>2021</year><access-date>2023-07-6</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://zenodo.org/record/5574486/export/hx">zenodo.org/record/5574486/export/hx</ext-link></comment></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>McKinney</surname><given-names>W</given-names></name></person-group><article-title>Data structures for statistical computing in Python</article-title><year>June 28 to July 3, 2010</year><conf-name>Presented at Proceedings of the 9th Python in Science Conference (SciPy 2010)</conf-name><conf-loc>Austin, Texas</conf-loc><fpage>56</fpage><lpage>61</lpage><pub-id pub-id-type="doi">10.25080/Majora-92bf1922-00a</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Leach</surname><given-names>PJ</given-names></name><name name-style="western"><surname>Salz</surname><given-names>R</given-names></name><name name-style="western"><surname>Mealling</surname><given-names>MH</given-names></name></person-group><article-title>A universally unique identifier (UUID) URN 
namespace</article-title><year>2005</year><access-date>2023-07-6</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://dl.acm.org/doi/pdf/10.17487/RFC4122">dl.acm.org/doi/pdf/10.17487/RFC4122</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Van Rossum</surname><given-names>G</given-names></name><name name-style="western"><surname>Drake</surname><given-names>FL</given-names></name></person-group><source>Python 3 Reference Manual</source><year>2009</year><publisher-loc>Scotts Valley, CA</publisher-loc><publisher-name>CreateSpace</publisher-name></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schmidt</surname><given-names>M</given-names></name><name name-style="western"><surname>Schmidt</surname><given-names>SAJ</given-names></name><name name-style="western"><surname>Sandegaard</surname><given-names>JL</given-names></name><name name-style="western"><surname>Ehrenstein</surname><given-names>V</given-names></name><name name-style="western"><surname>Pedersen</surname><given-names>L</given-names></name><name name-style="western"><surname>S&#x00F8;rensen</surname><given-names>HT</given-names></name></person-group><article-title>The Danish National Patient Registry: a review of content, data quality, and research potential</article-title><source>Clin Epidemiol</source><year>2015</year><month>11</month><day>17</day><volume>7</volume><fpage>449</fpage><lpage>490</lpage><pub-id pub-id-type="doi">10.2147/CLEP.S91125</pub-id><pub-id pub-id-type="medline">26604824</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mors</surname><given-names>O</given-names></name><name 
name-style="western"><surname>Perto</surname><given-names>GP</given-names></name><name name-style="western"><surname>Mortensen</surname><given-names>PB</given-names></name></person-group><article-title>The Danish Psychiatric Central Research Register</article-title><source>Scand J Public Health</source><year>2011</year><month>07</month><volume>39</volume><issue>7 Suppl</issue><fpage>54</fpage><lpage>57</lpage><pub-id pub-id-type="doi">10.1177/1403494810395825</pub-id><pub-id pub-id-type="medline">21775352</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Laugesen</surname><given-names>K</given-names></name><name name-style="western"><surname>Ludvigsson</surname><given-names>JF</given-names></name><name name-style="western"><surname>Schmidt</surname><given-names>M</given-names></name><name name-style="western"><surname>Gissler</surname><given-names>M</given-names></name><name name-style="western"><surname>Valdimarsdottir</surname><given-names>UA</given-names></name><name name-style="western"><surname>Lunde</surname><given-names>A</given-names></name><etal/></person-group><article-title>Nordic health registry-based research: A review of health care systems and key registries</article-title><source>Clin Epidemiol</source><year>2021</year><month>07</month><day>19</day><volume>13</volume><fpage>533</fpage><lpage>554</lpage><pub-id pub-id-type="doi">10.2147/CLEP.S314959</pub-id><pub-id pub-id-type="medline">34321928</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rajkomar</surname><given-names>A</given-names></name><name name-style="western"><surname>Dean</surname><given-names>J</given-names></name><name 
name-style="western"><surname>Kohane</surname><given-names>I</given-names></name></person-group><article-title>Machine learning in medicine. Reply</article-title><source>N Engl J Med</source><year>2019</year><month>06</month><day>27</day><volume>380</volume><issue>26</issue><fpage>2589</fpage><lpage>2590</lpage><pub-id pub-id-type="doi">10.1056/NEJMc1906060</pub-id><pub-id pub-id-type="medline">31242381</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vargas</surname><given-names>N</given-names></name><name name-style="western"><surname>Lebrun-Harris</surname><given-names>LA</given-names></name><name name-style="western"><surname>Weinberg</surname><given-names>J</given-names></name><name name-style="western"><surname>Dievler</surname><given-names>A</given-names></name><name name-style="western"><surname>Felix</surname><given-names>KL</given-names></name></person-group><article-title>Qualitative perspective on the learning health system: how the Community Health Applied Research Network paved the way for research in safety-net settings</article-title><source>Prog Community Health Partnersh</source><year>2018</year><volume>12</volume><issue>3</issue><fpage>329</fpage><lpage>339</lpage><pub-id pub-id-type="doi">10.1353/cpr.2018.0057</pub-id><pub-id pub-id-type="medline">30581176</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Squires</surname><given-names>JE</given-names></name><name name-style="western"><surname>Logan</surname><given-names>B</given-names></name><name name-style="western"><surname>Lorts</surname><given-names>A</given-names></name><name name-style="western"><surname>Haskell</surname><given-names>H</given-names></name><name 
name-style="western"><surname>Sisaithong</surname><given-names>K</given-names></name><name name-style="western"><surname>Pillari</surname><given-names>T</given-names></name><etal/></person-group><article-title>A learning health network for pediatric liver transplantation: inaugural meeting report from the Starzl Network for Excellence in Pediatric Transplantation</article-title><source>Pediatr Transplant</source><year>2019</year><month>09</month><volume>23</volume><issue>6</issue><fpage>e13528</fpage><pub-id pub-id-type="doi">10.1111/petr.13528</pub-id><pub-id pub-id-type="medline">31328841</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marsolo</surname><given-names>K</given-names></name><name name-style="western"><surname>Margolis</surname><given-names>PA</given-names></name><name name-style="western"><surname>Forrest</surname><given-names>CB</given-names></name><name name-style="western"><surname>Colletti</surname><given-names>RB</given-names></name><name name-style="western"><surname>Hutton</surname><given-names>JJ</given-names></name></person-group><article-title>A digital architecture for a network-based learning health system: integrating chronic care management, quality improvement, and research</article-title><source>EGEMS (Wash DC)</source><year>2015</year><month>08</month><day>17</day><volume>3</volume><issue>1</issue><fpage>1168</fpage><pub-id pub-id-type="doi">10.13063/2327-9214.1168</pub-id><pub-id pub-id-type="medline">26357665</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Donisi</surname><given-names>V</given-names></name><name name-style="western"><surname>Jones</surname><given-names>J</given-names></name><name 
name-style="western"><surname>Pertile</surname><given-names>R</given-names></name><name name-style="western"><surname>Salazzari</surname><given-names>D</given-names></name><name name-style="western"><surname>Grigoletti</surname><given-names>L</given-names></name><name name-style="western"><surname>Tansella</surname><given-names>M</given-names></name><etal/></person-group><article-title>The difficult task of predicting the costs of community-based mental health care. A comprehensive case register study</article-title><source>Epidemiol Psychiatr Sci</source><year>2011</year><month>09</month><volume>20</volume><issue>3</issue><fpage>245</fpage><lpage>256</lpage><pub-id pub-id-type="doi">10.1017/s2045796011000473</pub-id><pub-id pub-id-type="medline">21922967</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thornicroft</surname><given-names>G</given-names></name><name name-style="western"><surname>Bisoffi</surname><given-names>G</given-names></name><name name-style="western"><surname>De Salvia</surname><given-names>D</given-names></name><name name-style="western"><surname>Tansella</surname><given-names>M</given-names></name></person-group><article-title>Urban-rural differences in the associations between social deprivation and psychiatric service utilization in schizophrenia and all diagnoses: a case-register study in Northern Italy</article-title><source>Psychol Med</source><year>1993</year><month>05</month><volume>23</volume><issue>2</issue><fpage>487</fpage><lpage>496</lpage><pub-id pub-id-type="doi">10.1017/s0033291700028579</pub-id><pub-id pub-id-type="medline">8332662</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ferrara</surname><given-names>M</given-names></name><name 
name-style="western"><surname>Srihari</surname><given-names>VH</given-names></name></person-group><article-title>Early intervention for psychosis in the United States: Tailoring services to improve care for women</article-title><source>Psychiatr Serv</source><year>2021</year><month>01</month><day>1</day><volume>72</volume><issue>1</issue><fpage>5</fpage><lpage>6</lpage><pub-id pub-id-type="doi">10.1176/appi.ps.202000205</pub-id><pub-id pub-id-type="medline">32966169</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>Ministero della Salute</collab></person-group><article-title>Piano per l&#x2019;applicazione e la diffusione della Medicina di Genere</article-title><year>2019</year><access-date>2023-07-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.salute.gov.it/portale/donna/dettaglioPubblicazioniDonna.jsp?id=2860&#x0026;lingua=italiano">www.salute.gov.it/portale/donna/dettaglioPubblicazioniDonna.jsp?id=2860&#x0026;lingua=italiano</ext-link></comment></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Astbury</surname><given-names>J</given-names></name></person-group><article-title>Gender disparities in mental health</article-title><year>May 14-22, 2001</year><conf-name>Presented at Fifty-fourth World Health Assembly</conf-name><conf-loc>Geneva, Switzerland</conf-loc></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Meisner</surname><given-names>J</given-names></name><name name-style="western"><surname>Rasmussen</surname><given-names>S</given-names></name><name name-style="western"><surname>Benros</surname><given-names>ME</given-names></name></person-group><article-title>Towards precision psychiatry utilizing 
large-scale multimodal data paving the way for improved prevention and treatment of mental disorders</article-title><source>Neuroscience Applied</source><year>2023</year><volume>2</volume><fpage>101017</fpage><pub-id pub-id-type="doi">10.1016/j.nsa.2022.101017</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guaiana</surname><given-names>G</given-names></name><name name-style="western"><surname>O&#x2019;Reilly</surname><given-names>R</given-names></name><name name-style="western"><surname>Grassi</surname><given-names>L</given-names></name></person-group><article-title>A comparison of inpatient adult psychiatric services in Italy and Canada</article-title><source>Community Ment Health J</source><year>2019</year><month>01</month><volume>55</volume><issue>1</issue><fpage>51</fpage><lpage>56</lpage><pub-id pub-id-type="doi">10.1007/s10597-018-0283-3</pub-id><pub-id pub-id-type="medline">29725879</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martinelli</surname><given-names>A</given-names></name><name name-style="western"><surname>Iozzino</surname><given-names>L</given-names></name><name name-style="western"><surname>Ruggeri</surname><given-names>M</given-names></name><name name-style="western"><surname>Marston</surname><given-names>L</given-names></name><name name-style="western"><surname>Killaspy</surname><given-names>H</given-names></name></person-group><article-title>Mental health supported accommodation services in England and in Italy: a comparison</article-title><source>Soc Psychiatry Psychiatr Epidemiol</source><year>2019</year><month>11</month><volume>54</volume><issue>11</issue><fpage>1419</fpage><lpage>1427</lpage><pub-id pub-id-type="doi">10.1007/s00127-019-01723-9</pub-id><pub-id 
pub-id-type="medline">31055632</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bird</surname><given-names>V</given-names></name><name name-style="western"><surname>Miglietta</surname><given-names>E</given-names></name><name name-style="western"><surname>Giacco</surname><given-names>D</given-names></name><name name-style="western"><surname>Bauer</surname><given-names>M</given-names></name><name name-style="western"><surname>Greenberg</surname><given-names>L</given-names></name><name name-style="western"><surname>Lorant</surname><given-names>V</given-names></name><etal/></person-group><article-title>Factors associated with satisfaction of inpatient psychiatric care: a cross country comparison</article-title><source>Psychol Med</source><year>2020</year><month>01</month><volume>50</volume><issue>2</issue><fpage>284</fpage><lpage>292</lpage><pub-id pub-id-type="doi">10.1017/S0033291719000011</pub-id><pub-id pub-id-type="medline">30696510</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Perera</surname><given-names>G</given-names></name><name name-style="western"><surname>Broadbent</surname><given-names>M</given-names></name><name name-style="western"><surname>Callard</surname><given-names>F</given-names></name><name name-style="western"><surname>Chang</surname><given-names>CK</given-names></name><name name-style="western"><surname>Downs</surname><given-names>J</given-names></name><name name-style="western"><surname>Dutta</surname><given-names>R</given-names></name><etal/></person-group><article-title>Cohort profile of the South London and Maudsley NHS Foundation Trust Biomedical Research Centre (SLaM BRC) Case Register: current status and recent enhancement of an electronic mental health record-derived data 
resource</article-title><source>BMJ Open</source><year>2016</year><month>03</month><day>1</day><volume>6</volume><issue>3</issue><fpage>e008721</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2015-008721</pub-id><pub-id pub-id-type="medline">26932138</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Werbeloff</surname><given-names>N</given-names></name><name name-style="western"><surname>Osborn</surname><given-names>DPJ</given-names></name><name name-style="western"><surname>Patel</surname><given-names>R</given-names></name><name name-style="western"><surname>Taylor</surname><given-names>M</given-names></name><name name-style="western"><surname>Stewart</surname><given-names>R</given-names></name><name name-style="western"><surname>Broadbent</surname><given-names>M</given-names></name><etal/></person-group><article-title>The Camden &#x0026; Islington Research Database: using electronic mental health records for research</article-title><source>PLoS One</source><year>2018</year><month>01</month><day>29</day><volume>13</volume><issue>1</issue><fpage>e0190703</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0190703</pub-id><pub-id pub-id-type="medline">29377897</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Andreoli</surname><given-names>RRV</given-names></name><name name-style="western"><surname>Cassano</surname><given-names>GB</given-names></name></person-group><source>DSM-IV-TR. Manuale diagnostico e statistico dei disturbi mentali. Text revision. ICD-10/ICD-9-CM. 
Classificazione parallela</source><year>2007</year><publisher-loc>Amsterdam, Netherlands</publisher-loc><publisher-name>Elsevier</publisher-name></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kang</surname><given-names>H</given-names></name></person-group><article-title>The prevention and handling of the missing data</article-title><source>Korean J Anesthesiol</source><year>2013</year><month>05</month><volume>64</volume><issue>5</issue><fpage>402</fpage><lpage>406</lpage><pub-id pub-id-type="doi">10.4097/kjae.2013.64.5.402</pub-id><pub-id pub-id-type="medline">23741561</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Makaba</surname><given-names>T</given-names></name><name name-style="western"><surname>Dogo</surname><given-names>E</given-names></name></person-group><article-title>A comparison of strategies for missing values in data on machine learning classification algorithms</article-title><year>November 21-22, 2019</year><conf-name>Presented at 2019 International Multidisciplinary Information Technology and Engineering Conference (IMITEC)</conf-name><conf-loc>Vanderbijlpark, South Africa</conf-loc><fpage>1</fpage><lpage>7</lpage><pub-id pub-id-type="doi">10.1109/IMITEC45504.2019.9015889</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="web"><article-title>Istat | Istituto Nazionale di Statistica</article-title><access-date>2020-04-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://www.istat.it">www.istat.it</ext-link></comment></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Navarro</surname><given-names>CLA</given-names></name><name 
name-style="western"><surname>Damen</surname><given-names>JAA</given-names></name><name name-style="western"><surname>Takada</surname><given-names>T</given-names></name><name name-style="western"><surname>Nijman</surname><given-names>SWJ</given-names></name><name name-style="western"><surname>Dhiman</surname><given-names>P</given-names></name><name name-style="western"><surname>Ma</surname><given-names>J</given-names></name><etal/></person-group><article-title>Risk of bias in studies on prediction models developed using supervised machine learning techniques: systematic review</article-title><source>BMJ</source><year>2021</year><month>10</month><day>20</day><volume>375</volume><fpage>n2281</fpage><pub-id pub-id-type="doi">10.1136/bmj.n2281</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names></name><name name-style="western"><surname>Donders</surname><given-names>ART</given-names></name><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names></name><name name-style="western"><surname>Harrell</surname><given-names>FE</given-names></name></person-group><article-title>Penalized maximum likelihood estimation to directly adjust diagnostic and prognostic prediction models for overoptimism: a clinical example</article-title><source>J Clin Epidemiol</source><year>2004</year><month>12</month><volume>57</volume><issue>12</issue><fpage>1262</fpage><lpage>1270</lpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2004.01.020</pub-id><pub-id pub-id-type="medline">15617952</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Franceschini</surname><given-names>A</given-names></name><name 
name-style="western"><surname>Fattore</surname><given-names>L</given-names></name></person-group><article-title>Gender-specific approach in psychiatric diseases: because sex matters</article-title><source>Eur J Pharmacol</source><year>2021</year><month>04</month><day>5</day><volume>896</volume><fpage>173895</fpage><pub-id pub-id-type="doi">10.1016/j.ejphar.2021.173895</pub-id><pub-id pub-id-type="medline">33508283</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Heinssen</surname><given-names>RK</given-names></name><collab>National Institute of Mental Health</collab></person-group><article-title>Early Psychosis Intervention Network (EPINET): a learning healthcare system for early serious mental illness</article-title><year>2015</year><access-date>2023-07-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nimh.nih.gov/funding/grant-writing-and-application-process/concept-clearances/2015/early-psychosis-intervention-network-epinet-a-learning-healthcare-system-for-early-serious-mental-illness">www.nimh.nih.gov/funding/grant-writing-and-application-process/concept-clearances/2015/early-psychosis-intervention-network-epinet-a-learning-healthcare-system-for-early-serious-mental-illness</ext-link></comment></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="web"><article-title>STEP Learning Collaborative</article-title><access-date>2023-07-21</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.ctearlypsychosisnetwork.org/">www.ctearlypsychosisnetwork.org/</ext-link></comment></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Srihari</surname><given-names>VH</given-names></name><name 
name-style="western"><surname>Ferrara</surname><given-names>M</given-names></name><name name-style="western"><surname>Li</surname><given-names>F</given-names></name><name name-style="western"><surname>Kline</surname><given-names>E</given-names></name><name name-style="western"><surname>G&#x00FC;l&#x00F6;ks&#x00FC;z</surname><given-names>S</given-names></name><name name-style="western"><surname>Pollard</surname><given-names>JM</given-names></name><etal/></person-group><article-title>Reducing the duration of untreated psychosis (DUP) in a US community: a quasi-experimental trial</article-title><source>Schizophr Bull Open</source><year>2022</year><month>01</month><day>4</day><volume>3</volume><issue>1</issue><fpage>sgab057</fpage><pub-id pub-id-type="doi">10.1093/schizbullopen/sgab057</pub-id><pub-id pub-id-type="medline">35295656</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grassi</surname><given-names>L</given-names></name><name name-style="western"><surname>Stivanello</surname><given-names>E</given-names></name><name name-style="western"><surname>Murri</surname><given-names>MB</given-names></name><name name-style="western"><surname>Perlangeli</surname><given-names>V</given-names></name><name name-style="western"><surname>Pandolfi</surname><given-names>P</given-names></name><name name-style="western"><surname>Carnevali</surname><given-names>F</given-names></name><etal/></person-group><article-title>Mortality from cancer in people with severe mental disorders in Emilia Romagna Region, Italy</article-title><source>Psychooncology</source><year>2021</year><month>12</month><volume>30</volume><issue>12</issue><fpage>2039</fpage><lpage>2051</lpage><pub-id pub-id-type="doi">10.1002/pon.5805</pub-id><pub-id pub-id-type="medline">34499790</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pollard</surname><given-names>JM</given-names></name><name name-style="western"><surname>Ferrara</surname><given-names>M</given-names></name><name name-style="western"><surname>Lin</surname><given-names>IH</given-names></name><name name-style="western"><surname>Kucukgoncu</surname><given-names>S</given-names></name><name name-style="western"><surname>Wasser</surname><given-names>T</given-names></name><name name-style="western"><surname>Li</surname><given-names>F</given-names></name><etal/></person-group><article-title>Analysis of early intervention services on adult judicial outcomes</article-title><source>JAMA Psychiatry</source><year>2020</year><month>08</month><day>1</day><volume>77</volume><issue>8</issue><fpage>871</fpage><lpage>872</lpage><pub-id pub-id-type="doi">10.1001/jamapsychiatry.2020.0448</pub-id><pub-id pub-id-type="medline">32320010</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ferrara</surname><given-names>M</given-names></name><name name-style="western"><surname>Franchini</surname><given-names>G</given-names></name><name name-style="western"><surname>Funaro</surname><given-names>M</given-names></name><name name-style="western"><surname>Cutroni</surname><given-names>M</given-names></name><name name-style="western"><surname>Valier</surname><given-names>B</given-names></name><name name-style="western"><surname>Toffanin</surname><given-names>T</given-names></name><etal/></person-group><article-title>Machine learning and non-affective psychosis: identification, differential diagnosis, and treatment</article-title><source>Curr Psychiatry Rep</source><year>2022</year><month>12</month><volume>24</volume><issue>12</issue><fpage>925</fpage><lpage>936</lpage><pub-id pub-id-type="doi">10.1007/s11920-022-01399-0</pub-id><pub-id 
pub-id-type="medline">36399236</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Ferrara</surname><given-names>M</given-names></name><name name-style="western"><surname>Franchini</surname><given-names>G</given-names></name><name name-style="western"><surname>Funaro</surname><given-names>M</given-names></name><name name-style="western"><surname>Murri</surname><given-names>MB</given-names></name><name name-style="western"><surname>Toffanin</surname><given-names>T</given-names></name><name name-style="western"><surname>Zerbinati</surname><given-names>L</given-names></name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Sousa</surname><given-names>MJ</given-names></name><name name-style="western"><surname>Pani</surname><given-names>S</given-names></name><name name-style="western"><surname>dal Mas</surname><given-names>F</given-names></name><name name-style="western"><surname>Sousa</surname><given-names>S</given-names></name></person-group><article-title>Machine learning for mental health: focus on affective and non-affective psychosis</article-title><source>Incorporating AI Technology in the Service Sector: Innovations in Creating Knowledge, Improving Efficiency, and Elevating Quality of Life</source><year>2023</year><publisher-loc>Palm Bay, FL</publisher-loc><publisher-name>Apple Academic Press Inc</publisher-name></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Lipton</surname><given-names>ZC</given-names></name><name name-style="western"><surname>Kale</surname><given-names>DC</given-names></name><name name-style="western"><surname>Elkan</surname><given-names>C</given-names></name><name 
name-style="western"><surname>Wetzel</surname><given-names>R</given-names></name></person-group><article-title>Learning to diagnose with LSTM recurrent neural networks</article-title><source>arXiv. Preprint posted online on November 11, 2015</source><pub-id pub-id-type="doi">10.48550/arXiv.1511.03677</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Che</surname><given-names>Z</given-names></name><name name-style="western"><surname>Purushotham</surname><given-names>S</given-names></name><name name-style="western"><surname>Cho</surname><given-names>K</given-names></name><name name-style="western"><surname>Sontag</surname><given-names>D</given-names></name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names></name></person-group><article-title>Recurrent neural networks for multivariate time series with missing values</article-title><source>Sci Rep</source><year>2018</year><month>04</month><day>17</day><volume>8</volume><issue>1</issue><fpage>6085</fpage><pub-id pub-id-type="doi">10.1038/s41598-018-24271-9</pub-id><pub-id pub-id-type="medline">29666385</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Characteristics of the records within the tables of the Ferrara-Psychiatry (FEPSY) database.</p><media xlink:href="medinform_v11i1e45523_app1.docx" xlink:title="DOCX File, 17 KB"/></supplementary-material></app-group></back></article>