<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frai.2023.1187501</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Artificial Intelligence</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Assessing longitudinal housing status using Electronic Health Record data: a comparison of natural language processing, structured data, and patient-reported history</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chapman</surname> <given-names>Alec B.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1514746/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Cordasco</surname> <given-names>Kristina</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Chassman</surname> <given-names>Stephanie</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Panadero</surname> <given-names>Talia</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2249641/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Agans</surname> <given-names>Dylan</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Jackson</surname> <given-names>Nicholas</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Clair</surname> <given-names>Kimberly</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Nelson</surname> <given-names>Richard</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Montgomery</surname> <given-names>Ann Elizabeth</given-names></name>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
<xref ref-type="aff" rid="aff10"><sup>10</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/714858/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Tsai</surname> <given-names>Jack</given-names></name>
<xref ref-type="aff" rid="aff11"><sup>11</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Finley</surname> <given-names>Erin</given-names></name>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/558551/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gabrielian</surname> <given-names>Sonya</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff12"><sup>12</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1857059/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Informatics, Decision-Enhancement and Analytic Sciences (IDEAS) Center, Salt Lake City Veterans Affairs Healthcare System</institution>, <addr-line>Salt Lake City, UT</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Division of Epidemiology, University of Utah, School of Medicine</institution>, <addr-line>Salt Lake City, UT</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>Center for the Study of Healthcare Innovation, Implementation and Policy (CSHIIP), Greater Los Angeles Veterans Affairs Healthcare System</institution>, <addr-line>Los Angeles, CA</addr-line>, <country>United States</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Medicine, David Geffen School of Medicine, University of California, Los Angeles</institution>, <addr-line>Los Angeles, CA</addr-line>, <country>United States</country></aff>
<aff id="aff5"><sup>5</sup><institution>Desert Pacific Mental Illness Research, Education, and Clinical Center (MIRECC), Veterans Affairs Greater Los Angeles</institution>, <addr-line>Los Angeles, CA</addr-line>, <country>United States</country></aff>
<aff id="aff6"><sup>6</sup><institution>Department of Epidemiology, Fielding School of Public Health, University of California, Los Angeles</institution>, <addr-line>Los Angeles, CA</addr-line>, <country>United States</country></aff>
<aff id="aff7"><sup>7</sup><institution>Department of Community Health Sciences, Fielding School of Public Health, University of California, Los Angeles</institution>, <addr-line>Los Angeles, CA</addr-line>, <country>United States</country></aff>
<aff id="aff8"><sup>8</sup><institution>Department of Medicine Statistics Core, David Geffen School of Medicine, University of California, Los Angeles</institution>, <addr-line>Los Angeles, CA</addr-line>, <country>United States</country></aff>
<aff id="aff9"><sup>9</sup><institution>United States Department of Veterans Affairs, Birmingham Veterans Affairs Health Care System</institution>, <addr-line>Birmingham, AL</addr-line>, <country>United States</country></aff>
<aff id="aff10"><sup>10</sup><institution>School of Public Health, University of Alabama at Birmingham</institution>, <addr-line>Birmingham, AL</addr-line>, <country>United States</country></aff>
<aff id="aff11"><sup>11</sup><institution>National Homeless Programs Office, United States Department of Veterans Affairs</institution>, <addr-line>Washington, DC</addr-line>, <country>United States</country></aff>
<aff id="aff12"><sup>12</sup><institution>Department of Psychiatry and Biobehavioral Sciences, David Geffen School of Medicine, University of California, Los Angeles</institution>, <addr-line>Los Angeles, CA</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Jo&#x000E3;o Gama Marques, Centro Hospitalar Psiqui&#x000E1;trico de Lisboa, Portugal</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Lirong Wang, University of Pittsburgh, United States; Mike Conway, The University of Utah, United States</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Alec B. Chapman <email>alec.chapman&#x00040;hsc.utah.edu</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>24</day>
<month>05</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>6</volume>
<elocation-id>1187501</elocation-id>
<history>
<date date-type="received">
<day>22</day>
<month>03</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>05</day>
<month>05</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2023 Chapman, Cordasco, Chassman, Panadero, Agans, Jackson, Clair, Nelson, Montgomery, Tsai, Finley and Gabrielian.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Chapman, Cordasco, Chassman, Panadero, Agans, Jackson, Clair, Nelson, Montgomery, Tsai, Finley and Gabrielian</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Measuring long-term housing outcomes is important for evaluating the impacts of services for individuals with homeless experience. However, assessing long-term housing status using traditional methods is challenging. The Veterans Affairs (VA) Electronic Health Record (EHR) provides detailed data for a large population of patients with homeless experiences and contains several indicators of housing instability, including structured data elements (e.g., diagnosis codes) and free-text clinical narratives. However, the validity of each of these data elements for measuring housing stability over time is not well-studied.</p>
</sec>
<sec>
<title>Methods</title>
<p>We compared VA EHR indicators of housing instability, including information extracted from clinical notes using natural language processing (NLP), with patient-reported housing outcomes in a cohort of homeless-experienced Veterans.</p>
</sec>
<sec>
<title>Results</title>
<p>NLP achieved higher sensitivity and specificity than standard diagnosis codes for detecting episodes of unstable housing. Other structured data elements in the VA EHR showed promising performance, particularly when combined with NLP.</p>
</sec>
<sec>
<title>Discussion</title>
<p>Evaluation efforts and research studies assessing longitudinal housing outcomes should incorporate multiple data sources of documentation to achieve optimal performance.</p>
</sec>
</abstract>
<kwd-group>
<kwd>homelessness</kwd>
<kwd>electronic health records</kwd>
<kwd>natural language processing</kwd>
<kwd>veterans affairs</kwd>
<kwd>social determinants of health</kwd>
</kwd-group>
<contract-num rid="cn001">21-285</contract-num>
<contract-sponsor id="cn001">Quality Enhancement Research Initiative<named-content content-type="fundref-id">10.13039/100007181</named-content></contract-sponsor>
<counts>
<fig-count count="2"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="25"/>
<page-count count="10"/>
<word-count count="7651"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Medicine and Public Health</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1. Introduction</title>
<p>Social determinants of health (SDoH) significantly impact patients&#x00027; health and quality of life. Housing status is a key SDoH and ending homelessness among United States Veterans is a national priority for the Department of Veterans Affairs (VA), which provides a breadth of health and housing services for homeless-experienced Veterans (HEVs). To evaluate the effectiveness of VA homeless services, assessing short- and long-term housing outcomes is essential. However, to date, most studies that assess housing outcomes require collecting repeated patient-reported measures of housing status, which are costly and challenging to obtain.</p>
<p>In VA and other integrated healthcare systems, the Electronic Health Record (EHR) is a potentially valuable source of data regarding longitudinal housing outcomes. However, using EHR data for this purpose is challenging due to measurement error, missing data, and other complexities (Botsis et al., <xref ref-type="bibr" rid="B2">2010</xref>; Wells et al., <xref ref-type="bibr" rid="B25">2013</xref>; Glicksberg et al., <xref ref-type="bibr" rid="B8">2018</xref>) which can bias outcomes assessed using longitudinal analyses (Lin et al., <xref ref-type="bibr" rid="B13">2004</xref>; Pullenayegum and Lim, <xref ref-type="bibr" rid="B21">2016</xref>; Lokku et al., <xref ref-type="bibr" rid="B14">2021</xref>). SDoH are often recorded in the EHR using free-text clinical narratives (Organization, <xref ref-type="bibr" rid="B19">2004</xref>; Gundlapalli et al., <xref ref-type="bibr" rid="B9">2013</xref>, <xref ref-type="bibr" rid="B10">2015</xref>; Peterson and Gundlapalli, <xref ref-type="bibr" rid="B20">2015</xref>; Conway et al., <xref ref-type="bibr" rid="B5">2019</xref>; Chapman et al., <xref ref-type="bibr" rid="B4">2021</xref>; Hatef et al., <xref ref-type="bibr" rid="B11">2022</xref>; Lybarger and Yetisgen, <xref ref-type="bibr" rid="B15">2023</xref>; Tsai et al., <xref ref-type="bibr" rid="B23">2022</xref>), and several studies have developed methods for extracting housing data from clinical texts (Gundlapalli et al., <xref ref-type="bibr" rid="B9">2013</xref>; Conway et al., <xref ref-type="bibr" rid="B5">2019</xref>; Chapman et al., <xref ref-type="bibr" rid="B4">2021</xref>; Hatef et al., <xref ref-type="bibr" rid="B11">2022</xref>; Lybarger and Yetisgen, <xref ref-type="bibr" rid="B15">2023</xref>). 
In VA, one such system is Relative Housing Stability in Electronic Documentation (ReHouSED) (Chapman et al., <xref ref-type="bibr" rid="B4">2021</xref>), a Natural Language Processing (NLP) system developed to extract housing stability from the EHR to evaluate VA&#x00027;s homelessness prevention and rapid rehousing program. ReHouSED demonstrated higher validity for identifying homeless status compared to International Classification of Diseases 10<sup>th</sup> Revision (ICD-10) codes, a set of standardized codes representing clinical diagnoses and symptoms published by the World Health Organization (Organization, <xref ref-type="bibr" rid="B19">2004</xref>).</p>
<p>However, there are several challenges in applying ReHouSED to study housing outcomes. First, the system may need to be adjusted for particular patient cohorts or evaluating specific services. It was originally designed for HEVs engaged in a rapid rehousing program; HEVs enrolled in other homeless services may have different EHR note structures or linguistic patterns. Second, missing data may cause bias when using ReHouSED for measuring outcomes. Information is only recorded in the EHR when patients present for care, which may occur more frequently for some patients than others. This produces observations at highly irregular intervals rather than the fixed, regularly spaced assessments that are ideal for longitudinal data collection, which can lead to biased analyses unless methods account for missing data (Pullenayegum and Lim, <xref ref-type="bibr" rid="B21">2016</xref>; Lokku et al., <xref ref-type="bibr" rid="B14">2021</xref>). Third, measurement error is ubiquitous in studies that use EHR data, particularly when using NLP to extract information from complex free text. While NLP is often designed to improve upon the shortcomings of structured data, misclassification is still present. This is especially true for complex variables such as longitudinal housing outcomes.</p>
<p>In the rapid rehousing context, ReHouSED achieved moderate accuracy (average positive predictive value and sensitivity of 65.3 and 68.1, respectively) and expert annotators achieved modest inter-annotator agreement (Cohen&#x00027;s Kappa = 0.7) (Chapman et al., <xref ref-type="bibr" rid="B4">2021</xref>), demonstrating the complexity of the task. The accuracy of housing status classification can potentially be improved by combining NLP classifications with other EHR variables (e.g., ICD-10 codes) (Gundlapalli et al., <xref ref-type="bibr" rid="B10">2015</xref>; Peterson and Gundlapalli, <xref ref-type="bibr" rid="B20">2015</xref>; Wang et al., <xref ref-type="bibr" rid="B24">2016</xref>; Nelson et al., <xref ref-type="bibr" rid="B18">2018</xref>; Tsai et al., <xref ref-type="bibr" rid="B23">2022</xref>). However, the accuracy of these data elements, as well as the best combination of indices, is not well-studied, in part due to the challenge of constructing a reference standard.</p>
<p>We aimed to develop a &#x0201C;best practice&#x0201D; for assessing longitudinal housing instability using observational EHR data as part of a quality improvement initiative targeting VA&#x00027;s Grant and Per Diem (GPD) case management aftercare program (hereafter, &#x0201C;Aftercare&#x0201D;). In this program, VA partners with community-based homeless service agencies to provide 6 months of case management for HEVs undergoing housing transitions (e.g., from institutional settings to independent housing). For a cohort of Aftercare patients in Southern California, we collected patient-reported housing history for a 2-year period. We then extracted six indicators of housing instability from the VA EHR: clinical note classifications of housing status obtained using ReHouSED tailored for this cohort (Chapman et al., <xref ref-type="bibr" rid="B4">2021</xref>); ICD-10 codes for homelessness; notations of homeless service use found in outpatient visits; inpatient admissions associated with homelessness (e.g., residential treatment programs); a universal screening tool to assess housing instability; and data from VA&#x00027;s homeless registry. We compare the validity of each indicator of housing instability, considering the patient-reported data as a gold standard, and discuss implications for evaluations of housing interventions.</p>
</sec>
<sec id="s2">
<title>2. Materials and methods</title>
<sec>
<title>2.1. Setting and ethics</title>
<p>Our cohort consisted of 386 VA Greater Los Angeles patients who engaged in Aftercare between 10/1/2019 and 1/4/2021. This cohort was enrolled in a parent project evaluating the implementation of Critical Time Intervention, an evidence-based, structured, and time-limited case management practice (Herman et al., <xref ref-type="bibr" rid="B12">2000</xref>; Gabrielian et al., <xref ref-type="bibr" rid="B7">2022</xref>). All project activities were reviewed by VA&#x00027;s Central Institutional Review Board and designated as quality improvement.</p>
<p>We extracted patient demographics for the entire cohort including age, race, and ethnicity from administrative data collected as part of Aftercare. Additionally, we identified recent diagnoses of psychiatric and substance use disorders using ICD-10 diagnosis codes derived from the VA&#x00027;s National Psychosis Registry (Blow et al., <xref ref-type="bibr" rid="B1">2004</xref>). We included the following conditions in our analysis: alcohol use disorders; drug use disorders; schizophrenia spectrum and other psychotic disorders; bipolar disorders; major depressive disorder; anxiety disorders; and post-traumatic stress disorders. The complete list of ICD-10 codes can be found in the <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>. Of note, we did not assess for the presence of dementia or other major neurocognitive disorders (exclusion criteria from the housing program in which this cohort was engaged); mental retardation (which is incompatible with military service); or personality disorders (which are inaccurately captured in VA administrative data). Diagnosis codes were retrieved from outpatient and inpatient settings in the year preceding the patient lookback period (defined in the following paragraph).</p>
</sec>
<sec>
<title>2.2. Patient-reported housing outcomes</title>
<p>We recruited a random subsample of 61 patients from the cohort for detailed telephone assessments of their housing status from 7/1/2020 to 6/30/2022. The goal was to create a reference standard to enable refinement of EHR methodologies for assessing housing status. We sent recruitment letters to 188 randomly selected Veterans, 19 of whom opted into the study. 158 of the remaining Veterans received follow-up recruitment calls and 41 volunteered to participate.</p>
<p>Following verbal informed consent, assessments were conducted with the Residential Time-Line Follow Back (TLFB) inventory, a validated instrument that collects retrospective housing status (Mendelson et al., <xref ref-type="bibr" rid="B16">2010</xref>). The TLFB assigns codes for 34 different housing types (e.g., &#x0201C;On the street or in other outdoor place,&#x0201D; &#x0201C;Own apartment or house&#x0201D;) and classifies each type to one of four categories: &#x0201C;Literal Homelessness,&#x0201D; &#x0201C;Temporary,&#x0201D; &#x0201C;Stable,&#x0201D; and &#x0201C;Institutional.&#x0201D; In these analyses, we collapsed &#x0201C;Literal Homelessness&#x0201D; and &#x0201C;Temporary Housing&#x0201D; into a single &#x0201C;Unstable&#x0201D; category. Except for inpatient admissions coded as &#x0201C;Hospital (medical only),&#x0201D; any &#x0201C;Institutional&#x0201D; code was also considered to be &#x0201C;Unstable.&#x0201D; This meant that short-term institutional facilities, such as residential programs or crisis housing, were considered unstable.</p>
<p>Using standardized TLFB procedures, participants reported all changes in housing status over the specified period. We defined patient episodes as a continuous period spent &#x0201C;stable&#x0201D; or &#x0201C;unstable.&#x0201D; For example, patients who were stably housed during the entire period had a single episode (even if they changed addresses or moved to a different subcategory of stable housing), whereas a patient who was stably housed at the beginning of the period but then became unstably housed for the rest of the period had two episodes.</p>
</sec>
<sec>
<title>2.3. EHR indicators of housing status</title>
<p>EHR data for all patients in this subsample was obtained from VA&#x00027;s Corporate Data Warehouse (CDW), a national repository of demographics, diagnoses, clinical narratives, and other clinical and administrative data. Additional data was retrieved from the VA&#x00027;s homeless service registry and linked to CDW data.</p>
<sec>
<title>2.3.1. NLP system</title>
<p>We used ReHouSED to extract housing status from clinical notes in the subset of patients who completed telephone interviews (Chapman et al., <xref ref-type="bibr" rid="B4">2021</xref>). ReHouSED is a rule-based system implemented in medspaCy (Eyre et al., <xref ref-type="bibr" rid="B6">2021</xref>) that was originally developed to extract housing outcomes from HEVs participating in VA&#x00027;s rapid rehousing program. Rules are hand-crafted to define semantic phrase and syntactic patterns, matching entities related to homelessness (e.g., &#x0201C;sleeps in the park,&#x0201D; &#x0201C;needs shelter&#x0201D;) and housing stability (e.g., &#x0201C;lives in an apartment,&#x0201D; &#x0201C;no concerns about housing&#x0201D;). Each entity is then linked to any linguistic modifiers such as phrases indicating negation (e.g., &#x0201C;not currently&#x0201D;) or risk (e.g., &#x0201C;worried about being evicted&#x0201D;). Notes are also parsed to identify the clinical note sections, such as past medical history or social history. This contextual information is used to interpret whether each entity is referring to the patient&#x00027;s current housing status and whether they are stably housed. Based on text in a note, each note is assigned one of three housing status classifications: &#x0201C;Stable,&#x0201D; &#x0201C;Unstable,&#x0201D; or &#x0201C;Unknown.&#x0201D; The last of these classifications refers to notes that include some mention of housing or discussion of a patient&#x00027;s history of housing instability but have no discernible statement of the patient&#x00027;s current housing status. Examples of documents classified as &#x0201C;Unstable&#x0201D; and &#x0201C;Stable,&#x0201D; respectively, are shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p><bold>(A)</bold> A clinical note classified by ReHouSED as &#x0201C;Unstable.&#x0201D; The note states that the patient is living in a hotel and hopes to move into stable housing soon. HUD-VASH, HUD-Veterans Affairs Supportive Housing. <bold>(B)</bold> A clinical note classified by ReHouSED as &#x0201C;Stable.&#x0201D; The note mentions the patient&#x00027;s history of living in unstable housing but states that the patient is currently stably housed.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frai-06-1187501-g0001.tif"/>
</fig>
<p>Using a random sample of 250 notes from the larger cohort (<italic>n</italic> = 386), we tailored ReHouSED to fit housing outcome classifications pertinent to Aftercare. First, we identified clinical note templates and phrases related to the receipt of VA permanent supportive housing services (independent housing with financial subsidies and supportive services). Though ReHouSED initially classified permanent supportive housing as &#x0201C;Unstable,&#x0201D; we conceptualized permanent supportive housing as a positive (&#x0201C;Stable&#x0201D;) outcome for Aftercare patients. Second, while ReHouSED prioritized mentions of stable housing over mentions of homelessness or temporary housing in a clinical note, we modified the document classification logic to prioritize current mentions of VA&#x00027;s residential treatment program for HEVs (known as the Domiciliary); for HEVs engaged in Aftercare, enrollment in residential treatment was considered a negative (&#x0201C;Unstable&#x0201D;) outcome. Last, based on a review of this sample of notes, we added a small number of additional concepts that were not included in the original ReHouSED system (e.g., &#x0201C;currently incarcerated,&#x0201D; &#x0201C;sober home&#x0201D;).</p>
<p>We processed all notes mentioning housing keywords for interviewed patients during the 2-year assessment period. The housing keywords and additional exclusion criteria are the same as those described by Chapman et al. (<xref ref-type="bibr" rid="B4">2021</xref>). If multiple notes mentioning housing were present on a single day, we classified the encounter as &#x0201C;Unstable&#x0201D; if at least half of the notes were classified as &#x0201C;Unstable&#x0201D; after excluding &#x0201C;Unknown&#x0201D; notes. If fewer than half were classified as &#x0201C;Unstable,&#x0201D; or if there were no notes classified as &#x0201C;Stable&#x0201D; or &#x0201C;Unstable,&#x0201D; the housing status that day was deemed &#x0201C;Stable.&#x0201D;</p>
</sec>
<sec>
<title>2.3.2. Structured EHR data</title>
<p>We abstracted demographic data (age, gender, race, ethnicity) from the EHR. We also obtained structured EHR data elements that indicate housing instability: ICD-10 codes for behavioral health disorders (psychiatric diagnoses and substance use disorders); outpatient administrative data that indicate receipt of homeless services; inpatient administrative data that describe admission to programs for HEVs; and a homelessness screening tool. Each data element is detailed below. Specific value sets for each data element are provided in the <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>.</p>
<p><italic>ICD-10 codes:</italic> Several ICD-10 codes associated with outpatient visits or inpatient care indicate homelessness or risk of homelessness (e.g., &#x0201C;Z59.0: Homelessness, unspecified&#x0201D;). We retrieved all ICD-10 codes pertaining to homelessness or risk of homelessness during the study period. We conceptualized a patient as unstable if there was a homeless-associated ICD-10 code on a given day.</p>
<p><italic>Outpatient administrative data:</italic> In VA EHR, the type of outpatient clinical service is coded. We identified codes indicating use of VA homeless services and considered an encounter unstable if the Veteran received care from any of these services.</p>
<p><italic>Inpatient administrative data:</italic> For all hospital stays in the study cohort, we identified residential treatment programs for HEVs (conceptualized as inpatient admissions in VA, e.g., the &#x0201C;Domiciliary Care for Homeless Veterans (DCHV) program&#x0201D;).</p>
<p><italic>Homelessness screener:</italic> The Homelessness Screening Clinical Reminder (HSCR) is an instrument delivered to all Veteran outpatients to routinely screen for recent housing instability or risk of housing instability (Montgomery et al., <xref ref-type="bibr" rid="B17">2022</xref>). Responses to this screener are saved in the EHR as structured data elements. We identified positive responses from interviewed Veterans.</p>
</sec>
<sec>
<title>2.3.3. Homeless service registry data</title>
<p>The VA maintains an administrative database of homeless services provided to Veterans by the VA or its community partners, referred to as the homeless service registry (HOMES). We queried this database for enrollment and exit dates into housing assistance programs and considered patients to be unstably housed during their enrollment period.</p>
</sec>
</sec>
<sec>
<title>2.4. Analyses</title>
<sec>
<title>2.4.1. TLFB data</title>
<p>Using TLFB data, we calculated the count, percent of episodes, and total person-days spent in each of three categories: unstable, stable, and institutional. Because days spent in institutional settings (e.g., hospital admissions not related directly to homelessness) were expected to be uncommon and captured using inpatient administrative data, episodes assigned to this category were excluded from further analyses. We also derived a binary variable indicating whether the patient reported housing instability at any point in the 2-year assessment period. We measured the association between housing instability at any point with baseline characteristics (i.e., demographic variables and psychiatric diagnoses) using a logistic regression model.</p>
</sec>
<sec>
<title>2.4.2. VA service use frequency and type</title>
<p>Analyses using EHR data depend on documentation of patients&#x00027; service use, leading to missing data on days when patients are not engaged with the VA health system. To assess patterns of service utilization and corresponding rates of missingness, we calculated descriptive statistics of the frequency of encounters, defined as any inpatient or outpatient service documented in the EHR. We calculated the count and proportion of patients, person-days, and person-months with at least one encounter in VA during the data collection period. We also calculated the mean and standard deviation of the number of encounters per month. To assess the number of clinical notes discussing housing, we repeated each calculation limited to encounters that contained notes classified by ReHouSED as &#x0201C;Stable&#x0201D; or &#x0201C;Unstable.&#x0201D; To explore whether rates of encounter frequency differed between stably and unstably housed individuals, which could cause bias in longitudinal analyses, we stratified these statistics by whether they were ever unstably housed during the data collection period. We visually characterized encounter frequency in these two groups by plotting encounters over time using an abacus plot (Lokku et al., <xref ref-type="bibr" rid="B14">2021</xref>).</p>
</sec>
<sec>
<title>2.4.3. Validity of EHR indicators</title>
<p>We assessed the accuracy of each individual EHR indicator for differentiating stable vs. unstable housing. First, we calculated the proportion of ever unstably housed and never unstably housed patients who had each indicator. Indicators found to be present for fewer than two unstably housed patients were excluded from subsequent analyses. For the remaining indicators, we calculated encounter- and month-level sensitivity and specificity for each indicator. For encounter-level performance, we calculated sensitivity as the proportion of encounters during an episode of unstable housing where that indicator was present, and specificity as the proportion of encounters during stable episodes that did not have the indicator. We considered each of the EHR indicators individually as well as different combinations of EHR indicators (e.g., NLP and ICD-10 codes denoting housing instability). Bootstrapping was used to construct 90% confidence intervals.</p>
<p>A limitation of measuring the performance of EHR indicators at the encounter level is that many VA visits may not include documentation of a patient&#x00027;s housing status. For example, visits for medical/surgical procedures generally do not include documentation of housing status and would be counted as false negatives in the encounter-level sensitivity. To account for this, we first limited the data to encounters where the patient had at least one note classified as &#x0201C;Stable&#x0201D; or &#x0201C;Unstable&#x0201D; by ReHouSED; this required an explicit NLP classification of housing status and did not equate the absence of documented unstable housing to stable housing. Second, we aggregated data to patient-months. For each patient-month, the patient-reported housing status was considered unstable if the patient reported an episode of unstable housing that overlapped with that month. Using EHR data, a patient-month was classified as unstable if at least half of the patient&#x00027;s encounters during that month had indicators of instability. This month-level analysis was limited to patient-months that had at least one VA service use.</p>
<p>Unlike EHR data, the HOMES data records start and end dates of service use, removing the need for a patient to present for medical care to ascertain their housing status. To compare HOMES vs. EHR data, we restricted HOMES records to days in which patients had an EHR-recorded encounter, but separately calculated the total proportion of person-days (with or without an encounter) captured using HOMES data.</p>
</sec>
</sec>
</sec>
<sec id="s3">
<title>3. Results</title>
<p><xref ref-type="table" rid="T1">Table 1</xref> summarizes demographics for patients who provided self-reported housing history (&#x0201C;interviewed&#x0201D;) vs. those who did not. Among interviewed patients, most (63.9%) were &#x0003E;60 years old and 85.2% were male. Over half (54.1%) were African American. Among the entire cohort, the most common psychiatric diagnoses were major depressive (27.2%) and post-traumatic stress disorders (24.9%), with a smaller proportion of patients demonstrating evidence of drug use (13.2%), alcohol use (16.1%), or psychotic spectrum disorders (4.9%).</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Sample demographics.</p></caption> 
<table frame="box" rules="all">
<thead>
<tr style="background-color:&#x00023;919498;color:&#x00023;ffffff">
<th valign="top" align="left"><bold>Characteristic</bold></th>
<th valign="top" align="center" colspan="2"><bold>Interviewed</bold></th>
<th/>
</tr>
<tr style="background-color:&#x00023;919498;color:&#x00023;ffffff">
<th/>
<th valign="top" align="center"><bold>Yes, <italic>n</italic> = 61</bold></th>
<th valign="top" align="center"><bold>No, <italic>n</italic> = 325</bold></th>
<th valign="top" align="center"><bold>Overall, <italic>n</italic> = 386</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Age (mean, SD, in years)</td>
<td valign="top" align="center">60.6, 11.3</td>
<td valign="top" align="center">59.7, 14.7</td>
<td valign="top" align="center">59.8, 14.2</td>
</tr> <tr>
<td valign="top" align="left">&#x0003C; 40 years (<italic>n</italic>, %)</td>
<td valign="top" align="center">2 (3.3%)</td>
<td valign="top" align="center">45 (13.8%)</td>
<td valign="top" align="center">47 (12.2%)</td>
</tr> <tr>
<td valign="top" align="left">40&#x02013;50 years (<italic>n</italic>, %)</td>
<td valign="top" align="center">11 (18.0%)</td>
<td valign="top" align="center">39 (12.0%)</td>
<td valign="top" align="center">50 (13.0%)</td>
</tr> <tr>
<td valign="top" align="left">50&#x02013;60 years (<italic>n</italic>, %)</td>
<td valign="top" align="center">9 (14.8%)</td>
<td valign="top" align="center">43 (13.2%)</td>
<td valign="top" align="center">52 (13.5%)</td>
</tr> <tr>
<td valign="top" align="left">&#x0003E;60 years (<italic>n</italic>, %)</td>
<td valign="top" align="center">39 (63.9%)</td>
<td valign="top" align="center">198 (60.9%)</td>
<td valign="top" align="center">237 (61.4%)</td>
</tr> <tr style="background-color:#e0e1e3">
<td valign="top" align="left" colspan="4"><bold>Self-identified gender (</bold><italic><bold>n</bold></italic><bold>, %)</bold></td>
</tr> <tr>
<td valign="top" align="left">Female</td>
<td valign="top" align="center">9 (14.8%)</td>
<td valign="top" align="center">28 (8.6%)</td>
<td valign="top" align="center">37 (9.6%)</td>
</tr> <tr>
<td valign="top" align="left">Male</td>
<td valign="top" align="center">52 (85.2%)</td>
<td valign="top" align="center">297 (91.4%)</td>
<td valign="top" align="center">349 (90.4%)</td>
</tr> <tr style="background-color:#e0e1e3">
<td valign="top" align="left" colspan="4"><bold>Race (</bold><italic><bold>n</bold></italic><bold>, %)</bold></td>
</tr> <tr>
<td valign="top" align="left">American Indian/Alaska Native</td>
<td valign="top" align="center">0 (0.0%)</td>
<td valign="top" align="center">11 (3.4%)</td>
<td valign="top" align="center">11 (2.8%)</td>
</tr> <tr>
<td valign="top" align="left">Black/African American</td>
<td valign="top" align="center">33 (54.1%)</td>
<td valign="top" align="center">135 (41.5%)</td>
<td valign="top" align="center">168 (43.5%)</td>
</tr> <tr>
<td valign="top" align="left">Native Hawaiian/Other Pacific Islander</td>
<td valign="top" align="center">1 (1.6%)</td>
<td valign="top" align="center">3 (0.9%)</td>
<td valign="top" align="center">4 (1.0%)</td>
</tr> <tr>
<td valign="top" align="left">White</td>
<td valign="top" align="center">24 (39.3%)</td>
<td valign="top" align="center">147 (45.2%)</td>
<td valign="top" align="center">171 (44.3%)</td>
</tr> <tr>
<td valign="top" align="left">Missing/Other</td>
<td valign="top" align="center">3 (4.9%)</td>
<td valign="top" align="center">29 (8.9%)</td>
<td valign="top" align="center">32 (8.3%)</td>
</tr> <tr style="background-color:#e0e1e3">
<td valign="top" align="left" colspan="4"><bold>Ethnicity (</bold><italic><bold>n</bold></italic><bold>, %)</bold></td>
</tr> <tr>
<td valign="top" align="left">Hispanic or Latino</td>
<td valign="top" align="center">3 (4.9%)</td>
<td valign="top" align="center">40 (12.3%)</td>
<td valign="top" align="center">43 (11.1%)</td>
</tr> <tr>
<td valign="top" align="left">Not Hispanic or Latino</td>
<td valign="top" align="center">56 (91.8%)</td>
<td valign="top" align="center">269 (82.8%)</td>
<td valign="top" align="center">325 (84.2%)</td>
</tr> <tr>
<td valign="top" align="left">Missing/Other</td>
<td valign="top" align="center">2 (3.3%)</td>
<td valign="top" align="center">16 (4.9%)</td>
<td valign="top" align="center">18 (4.7%)</td>
</tr> <tr style="background-color:#e0e1e3">
<td valign="top" align="left" colspan="4"><bold>Psychiatric and substance use disorders (</bold><italic><bold>n</bold></italic><bold>, %)</bold></td>
</tr> <tr>
<td valign="top" align="left">Bipolar disorder</td>
<td valign="top" align="center">1 (1.6%)</td>
<td valign="top" align="center">8 (2.5%)</td>
<td valign="top" align="center">9 (2.3%)</td>
</tr> <tr>
<td valign="top" align="left">Major depressive disorder</td>
<td valign="top" align="center">19 (31.1%)</td>
<td valign="top" align="center">86 (26.5%)</td>
<td valign="top" align="center">105 (27.2%)</td>
</tr> <tr>
<td valign="top" align="left">Anxiety disorder</td>
<td valign="top" align="center">9 (14.8%)</td>
<td valign="top" align="center">56 (17.2%)</td>
<td valign="top" align="center">65 (16.8%)</td>
</tr> <tr>
<td valign="top" align="left">Post-traumatic stress disorders</td>
<td valign="top" align="center">16 (26.2%)</td>
<td valign="top" align="center">80 (24.6%)</td>
<td valign="top" align="center">96 (24.9%)</td>
</tr> <tr>
<td valign="top" align="left">Schizophrenia spectrum and other psychiatric disorders</td>
<td valign="top" align="center">2 (3.3%)</td>
<td valign="top" align="center">17 (5.2%)</td>
<td valign="top" align="center">19 (4.9%)</td>
</tr> <tr>
<td valign="top" align="left">Alcohol use disorder</td>
<td valign="top" align="center">8 (13.1%)</td>
<td valign="top" align="center">54 (16.6%)</td>
<td valign="top" align="center">62 (16.1%)</td>
</tr>
<tr>
<td valign="top" align="left">Drug use disorder</td>
<td valign="top" align="center">9 (14.8%)</td>
<td valign="top" align="center">42 (12.9%)</td>
<td valign="top" align="center">51 (13.2%)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>n</italic>, number of patients; SD, standard deviation.</p>
</table-wrap-foot>
</table-wrap>
<sec>
<title>3.1. Patient-reported housing status</title>
<p><xref ref-type="table" rid="T2">Table 2</xref> summarizes patient-reported housing episodes, stratified as institutional, unstable, or stable. Most of the cohort was stably housed during the period examined, with most patients (<italic>n</italic> = 56, 91.8% of all patients) reporting stable housing at least once during the period, for a total of 35,953 person-days. Fewer (<italic>n</italic> = 12, 19.7%) patients reported being unstably housed at least once, for a sum of 3,803 person-days. Episodes of stable housing typically lasted longer than episodes of unstable housing (mean 486 days vs. 200 days). Very few (<italic>n</italic> = 4, 6.6%) patients reported time spent in institutions, accounting for a total of 112 person-days. These 112 days (presumed to be hospitalizations) are excluded in subsequent analyses.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Summary of patient-reported housing status episodes from 7/1/2020 - 6/30/2022, obtained using the Residential Time-Line Follow Back (TLFB) inventory on a cohort of 61 patients.</p></caption> 
<table frame="box" rules="all">
<thead>
<tr style="background-color:&#x00023;919498;color:&#x00023;ffffff">
<th valign="top" align="left"><bold>Characteristic</bold></th>
<th valign="top" align="center"><bold>Institutional</bold></th>
<th valign="top" align="center"><bold>Stable</bold></th>
<th valign="top" align="center"><bold>Unstable</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Number (%) of patients reporting at least one housing episode (total number of patients = 61)</td>
<td valign="top" align="center">4 (6.6%)</td>
<td valign="top" align="center">56 (91.8%)</td>
<td valign="top" align="center">12 (19.7%)</td>
</tr> <tr>
<td valign="top" align="left">Number (%) of episodes in each category (total number of episodes = 97)</td>
<td valign="top" align="center">4 (4.1%)</td>
<td valign="top" align="center">74 (76.3%)</td>
<td valign="top" align="center">19 (19.6%)</td>
</tr> <tr>
<td valign="top" align="left">Number (%) person days spent in each category (total number of person-days = 39,868)</td>
<td valign="top" align="center">112 (0.3%)</td>
<td valign="top" align="center">35,953 (90.2%)</td>
<td valign="top" align="center">3,803 (9.5%)</td>
</tr> <tr style="background-color:#e0e1e3">
<td valign="top" align="left" colspan="4"><bold>Episode duration, in days</bold></td>
</tr> <tr>
<td valign="top" align="left">Minimum</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">38</td>
<td valign="top" align="center">3</td>
</tr> <tr>
<td valign="top" align="left">Maximum</td>
<td valign="top" align="center">74</td>
<td valign="top" align="center">729</td>
<td valign="top" align="center">667</td>
</tr> <tr>
<td valign="top" align="left">Mean (SD)</td>
<td valign="top" align="center">28 (33.1)</td>
<td valign="top" align="center">485.9 (253.4)</td>
<td valign="top" align="center">200.2 (226.6)</td>
</tr>
<tr>
<td valign="top" align="left">Median</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">578</td>
<td valign="top" align="center">91</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>SD, Standard deviation.</p>
</table-wrap-foot>
</table-wrap>
<p>The coefficients for the logistic regression model of housing instability at any point are shown in <xref ref-type="table" rid="T3">Table 3</xref>. There was no significant association between housing instability and any demographic variable (i.e., race, ethnicity, age, or gender), but there was some evidence of higher odds of housing instability for patients diagnosed with one or more psychiatric disorders (odds ratio = 7.85, 90% confidence interval = [1.61, 56.4]), as well as one or more substance use disorders (22.7 [4.75, 146]).</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Coefficients for logistic regression model relating baseline characteristics and diagnoses to reported housing instability at any point between 7/1/2020-6/30/2022 for a sample cohort of 61 patients.</p></caption> 
<table frame="box" rules="all">
<thead>
<tr style="background-color:&#x00023;919498;color:&#x00023;ffffff">
<th valign="top" align="left"><bold>Characteristic</bold></th>
<th valign="top" align="center"><bold>OR</bold></th>
<th valign="top" align="center"><bold>90% CI</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="center">0.99</td>
<td valign="top" align="center">0.93, 1.06</td>
</tr> <tr>
<td valign="top" align="left">Ethnicity not Hispanic or Latino</td>
<td valign="top" align="center">REF</td>
<td valign="top" align="center">REF</td>
</tr> <tr>
<td valign="top" align="left">Hispanic or Latino</td>
<td valign="top" align="center">0.10</td>
<td valign="top" align="center">0.00, 1.54</td>
</tr> <tr>
<td valign="top" align="left">Race<break/> White</td>
<td valign="top" align="center">REF</td>
<td valign="top" align="center">REF</td>
</tr> <tr>
<td valign="top" align="left">Non-white</td>
<td valign="top" align="center">0.30</td>
<td valign="top" align="center">0.06, 1.32</td>
</tr> <tr>
<td valign="top" align="left">Gender<break/> Male</td>
<td valign="top" align="center">REF</td>
<td valign="top" align="center">REF</td>
</tr> <tr>
<td valign="top" align="left">Female</td>
<td valign="top" align="center">1.01</td>
<td valign="top" align="center">0.08, 7.49</td>
</tr> <tr>
<td valign="top" align="left">Any psychiatric disorder<xref ref-type="table-fn" rid="TN1"><sup>&#x0002A;</sup></xref></td>
<td valign="top" align="center">7.85</td>
<td valign="top" align="center">1.61, 56.4</td>
</tr>
<tr>
<td valign="top" align="left">Substance use disorder<xref ref-type="table-fn" rid="TN2"><sup>&#x0002A;&#x0002A;</sup></xref></td>
<td valign="top" align="center">22.7</td>
<td valign="top" align="center">4.75, 146</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>OR, Odds ratio; CI, Confidence interval.</p>
<fn id="TN1"><label>&#x0002A;</label><p>Psychiatric disorders include bipolar disorder, major depressive disorder, anxiety disorders, post-traumatic stress disorders, or schizophrenia spectrum/other psychotic disorders.</p></fn>
<fn id="TN2"><label>&#x0002A;&#x0002A;</label><p>Substance use disorders include alcohol use disorder, cannabis use disorder, cocaine use disorder, opioid use disorder, hallucinogen use disorder, sedative use disorder, and other stimulants/psychoactives use disorders.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>3.2. EHR encounters</title>
<p>Most (58) patients had an encounter at some point over the 2 years. Patients who experienced unstable housing had more encounters per month compared to patients who remained stably housed (mean 7.0 vs. 5.1, ratio = 1.37). Limiting to encounters with notes mentioning housing, this ratio increased slightly (mean 3.6 vs. 2.4, ratio = 1.5). Similarly, patients with unstable housing experiences had a higher probability of having at least one encounter in a given month. This difference in visit frequency is shown visually in <xref ref-type="fig" rid="F2">Figure 2</xref>, which plots visit frequency over the 1st year of the study period for a randomly selected subsample of 12 patients with no unstable housing (top panel) and the 12 patients who reported unstable housing (bottom). Points represent an encounter at the specified time point, with shape representing the patient&#x00027;s reported housing status at the time (unstable encounters are marked by solid circles, while stable encounters are marked by an &#x0201C;x&#x0201D;). There is clear variation across patients in visit frequency. Unstable episodes are characterized by dense clusters of visits, while periods of stable housing tend to be sparser and more spread out, suggesting that this population of patients may interact with the VA healthcare system less frequently during long periods of housing stability.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>An abacus plot displaying the frequency of patient visits over time. The <bold>top</bold> panel displays visits for a subsample of patients who were stably housed during the first year of the assessment period. The <bold>bottom</bold> panel displays visits for patients who were unstably housed at some point in the assessment period, with encounters on unstably housed days shown in solid circles.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frai-06-1187501-g0002.tif"/>
</fig>
</sec>
<sec>
<title>3.3. Validity of EHR indicators</title>
<p>Of the 12 patients who reported at least one unstably housed experience on the TLFB, 11 (91.7%) had some documentation of unstable housing over the assessment period, while 1 (8.3%) did not have any data elements indicating housing instability. NLP, ICD-10 codes, and outpatient administrative data were each present for all of these 11 patients, while the inpatient variables and the homelessness screener were each used with only 1 patient. Most (8/12, 66.7%) patients with unstable housing experiences were recorded in HOMES as having received homeless services.</p>
<p>We examined encounter- and month-level sensitivity and specificity for NLP, ICD-10 codes, outpatient data, and HOMES, as well as combinations of the structured EHR data and NLP. <xref ref-type="table" rid="T4">Table 4</xref> shows the results for individual indicators, combinations of NLP and ICD-10 codes, and combinations of NLP and any structured data, including VA-specific data elements; data were restricted to person-days and months where the patient had a VA encounter. At the encounter level, NLP displayed higher sensitivity (0.197, bootstrapped 90% CI = [0.143, 0.251]) than ICD-10 codes (0.098 [0.039, 0.157]) and outpatient data (0.102 [0.074, 0.129]), but lower sensitivity than HOMES (0.268 [0.076, 0.459]). Bootstrapped confidence intervals for sensitivity were wide due to the small number of unstably housed patients. The widest confidence intervals were observed for HOMES data due to high between-subject variation (i.e., only 66.7% of unstably housed patients were in the registry). Encounter-level specificity was highest for HOMES (0.969 [0.947, 0.990]) and outpatient data (0.967 [0.950, 0.983]), and lower for NLP (0.948 [0.936, 0.960]) and ICD-10 codes (0.943 [0.922, 0.964]).</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Sensitivity and specificity, and confidence intervals, for four EHR indicators of unstable housing at the encounter and month level.</p></caption> 
<table frame="box" rules="all">
<thead>
<tr style="background-color:&#x00023;919498;color:&#x00023;ffffff">
<th/>
<th valign="top" align="center" colspan="2"><bold>Encounter</bold></th>
<th valign="top" align="center" colspan="2"><bold>Encounters with notes documenting housing status</bold></th>
<th valign="top" align="center" colspan="2"><bold>Month</bold></th>
</tr>
<tr style="background-color:&#x00023;919498;color:&#x00023;ffffff">
<th valign="top" align="left"><bold>EHR indicator</bold></th>
<th valign="top" align="center"><bold>Sensitivity (</bold><italic><bold>n</bold></italic> = <bold>796)</bold></th>
<th valign="top" align="center"><bold>Specificity (</bold><italic><bold>n</bold></italic> = <bold>4,932)</bold></th>
<th valign="top" align="center"><bold>Sensitivity (</bold><italic><bold>n</bold></italic> = <bold>228)</bold></th>
<th valign="top" align="center"><bold>Specificity (</bold><italic><bold>n</bold></italic> = <bold>749)</bold></th>
<th valign="top" align="center"><bold>Sensitivity (</bold><italic><bold>n</bold></italic> = <bold>114)</bold></th>
<th valign="top" align="center"><bold>Specificity (</bold><italic><bold>n</bold></italic> = <bold>962)</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">NLP</td>
<td valign="top" align="center">0.197 (0.143, 0.251)</td>
<td valign="top" align="center">0.948 (0.936, 0.960)</td>
<td valign="top" align="center"><bold>0.689 (0.595, 0.782)</bold></td>
<td valign="top" align="center">0.658 (0.599, 0.717)</td>
<td valign="top" align="center"><bold>0.421 (0.313, 0.529)</bold></td>
<td valign="top" align="center">0.876 (0.847, 0.906)</td>
</tr> <tr>
<td valign="top" align="left">ICD-10</td>
<td valign="top" align="center">0.098 (0.039, 0.157)</td>
<td valign="top" align="center">0.943 (0.922, 0.964)</td>
<td valign="top" align="center">0.224 (0.095, 0.352)</td>
<td valign="top" align="center">0.862 (0.820, 0.904)</td>
<td valign="top" align="center">0.298 (0.207, 0.389)</td>
<td valign="top" align="center">0.858 (0.809, 0.907)</td>
</tr> <tr>
<td valign="top" align="left">Outpatient admin</td>
<td valign="top" align="center">0.102 (0.074, 0.129)</td>
<td valign="top" align="center">0.967 (0.950, 0.983)</td>
<td valign="top" align="center">0.259 (0.190, 0.328)</td>
<td valign="top" align="center">0.919 (0.872, 0.965)</td>
<td valign="top" align="center">0.360 (0.238, 0.481)</td>
<td valign="top" align="center">0.878 (0.826, 0.931)</td>
</tr> <tr>
<td valign="top" align="left">HOMES</td>
<td valign="top" align="center"><bold>0.268 (0.076, 0.459)</bold></td>
<td valign="top" align="center"><bold>0.969 (0.947, 0.990)</bold></td>
<td valign="top" align="center">0.311 (0.063, 0.560)</td>
<td valign="top" align="center"><bold>0.928 (0.869, 0.986)</bold></td>
<td valign="top" align="center">0.254 (0.082, 0.427)</td>
<td valign="top" align="center"><bold>0.964 (0.935, 0.992)</bold></td>
</tr> <tr>
<td valign="top" align="left">NLP or ICD-10</td>
<td valign="top" align="center"><bold>0.246 (0.187, 0.306)</bold></td>
<td valign="top" align="center">0.900 (0.873, 0.928)</td>
<td valign="top" align="center"><bold>0.741 (0.653, 0.830)</bold></td>
<td valign="top" align="center">0.581 (0.523, 0.638)</td>
<td valign="top" align="center"><bold>0.535 (0.433, 0.637)</bold></td>
<td valign="top" align="center">0.778 (0.727, 0.828)</td>
</tr> <tr>
<td valign="top" align="left">NLP and ICD-10</td>
<td valign="top" align="center">0.049 (0.012, 0.086)</td>
<td valign="top" align="center"><bold>0.991 (0.987, 0.995)</bold></td>
<td valign="top" align="center">0.171 (0.055, 0.287)</td>
<td valign="top" align="center"><bold>0.940 (0.917, 0.963)</bold></td>
<td valign="top" align="center">0.184 (0.119, 0.250)</td>
<td valign="top" align="center"><bold>0.956 (0.938, 0.974)</bold></td>
</tr> <tr>
<td valign="top" align="left">Any structured</td>
<td valign="top" align="center">0.377 (0.206, 0.548)</td>
<td valign="top" align="center">0.897 (0.866, 0.927)</td>
<td valign="top" align="center">0.592 (0.410, 0.774)</td>
<td valign="top" align="center">0.768 (0.697, 0.838)</td>
<td valign="top" align="center">0.518 (0.416, 0.619)</td>
<td valign="top" align="center">0.775 (0.711, 0.840)</td>
</tr> <tr>
<td valign="top" align="left">NLP or any structured</td>
<td valign="top" align="center"><bold>0.450 (0.298, 0.602)</bold></td>
<td valign="top" align="center">0.861 (0.826, 0.895)</td>
<td valign="top" align="center"><bold>0.846 (0.769, 0.924)</bold></td>
<td valign="top" align="center">0.531 (0.464, 0.599)</td>
<td valign="top" align="center"><bold>0.640 (0.525, 0.756)</bold></td>
<td valign="top" align="center">0.712 (0.649, 0.775)</td>
</tr>
<tr>
<td valign="top" align="left">NLP and any structured</td>
<td valign="top" align="center">0.124 (0.068, 0.181)</td>
<td valign="top" align="center"><bold>0.984 (0.978, 0.990)</bold></td>
<td valign="top" align="center">0.434 (0.272, 0.596)</td>
<td valign="top" align="center"><bold>0.895 (0.853, 0.936)</bold></td>
<td valign="top" align="center">0.298 (0.218, 0.378)</td>
<td valign="top" align="center"><bold>0.940 (0.916, 0.964)</bold></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>n</italic>, Number of encounters (columns 1-2), encounters with notes (columns 3-4), and patient-months (columns 5-6); NLP, Natural language processing; ICD-10, International Classification of Diseases (10th edition); HOMES, Homelessness service registry data.</p>
<p><sup>&#x0002A;</sup>Structured data = ICD-10, outpatient data, or HOMES.</p>
<p>The highest individual and composite sensitivity and specificity are shown in bold.</p>
</table-wrap-foot>
</table-wrap>
<p>When limited to encounters with notes pertaining to housing, NLP had the highest sensitivity (0.689 [0.595, 0.782]) and the lowest specificity (0.658 [0.599, 0.717]). The other three indicators each saw increased sensitivity and decreased specificity, although the change was less extreme than for NLP. When aggregating to the month level, NLP again saw the highest sensitivity (0.421 [0.313, 0.529]). HOMES, which had the highest encounter-level sensitivity, had the lowest sensitivity at the patient-month level (0.254 [0.082, 0.427]) due to the high percentage of unstably housed patients (33.3%) who were not captured in this dataset. ICD-10 codes had the second-lowest sensitivity (0.298 [0.207, 0.389]) and the lowest specificity (0.858 [0.809, 0.907]).</p>
<p>Composite measures using any of the three structured elements had higher sensitivity and lower specificity than any of the structured elements at each level of analysis. A similar pattern was observed when using NLP or any structured data. Requiring NLP and structured EHR data of housing instability achieved lower sensitivity and higher specificity than NLP or HOMES individually but maintained higher sensitivity as well as specificity than when using only ICD-10 codes and outpatient administrative data.</p>
<p>Across all person-days during the assessment period regardless of whether the patient had an encounter, HOMES had a sensitivity of 0.2 [0.067, 0.335] and specificity of 0.971 [0.954, 0.996]. The sensitivity achieved at the person-day level using the combination of all three EHR indicators (i.e., patients having at least one of NLP, ICD-10, or outpatient administrative data) was 0.06 [0.03, 0.08], showing an advantage of using HOMES administrative data that did not require patients to present for care.</p>
</sec>
</sec>
<sec id="s4">
<title>4. Discussion</title>
<p>We compared patient-reported housing history with clinical and administrative data regarding housing status for a cohort of homeless-experienced VA patients. Our goal was to compare the validity of different data elements to identify best practices for assessing longitudinal housing outcomes using EHR data. Among the small number of patients who experienced housing instability in our cohort, most had EHR documentation of their housing status. Using NLP to supplement standard structured data elements with information recorded in clinical notes led to a more complete assessment of longitudinal housing outcomes. This is an important finding with methodologic implications for optimizing the validity of assessing patients&#x00027; longitudinal housing outcomes using EHR data when patient-level data collection is not feasible due to sample size or resource constraints.</p>
<p>In these analyses, sensitivity and specificity varied by EHR extraction method. NLP generally had higher sensitivity than structured EHR data for capturing repeated occurrences of housing instability, but demonstrated lower specificity than some structured elements. ICD-10 codes, which are often used in epidemiologic studies, had lower sensitivity and specificity than most other indicators, including NLP. Combining NLP and ICD-10 codes increased sensitivity but decreased specificity. These findings build on prior work with ReHouSED in a distinct cohort of VA patients engaged in rapid rehousing (Chapman et al., <xref ref-type="bibr" rid="B4">2021</xref>); at the patient-month level, both analyses provide evidence that ReHouSED performs better than ICD-10 codes in measuring housing instability.</p>
<p>The VA EHR contains data elements for documenting housing instability that are unique to VA. In particular, outpatient administrative data had higher specificity than NLP and higher sensitivity than ICD-10 codes. Combinations of these three elements could be used to tailor definitions to improve sensitivity or specificity as appropriate for a particular cohort or analysis. Additionally, while encounter- and month-level performance varied across different data elements, patient-level sensitivity was similarly high for NLP, ICD-10 codes, and outpatient administrative data, suggesting structured data may be sufficient for constructing coarse definitions of housing instability (e.g., identifying patients with a history of housing instability at any point in time).</p>
<p>When patients received services recorded in HOMES, those episodes of housing instability were captured with high sensitivity and specificity. However, this dataset does not capture an important segment of the population that is disengaged from VA homeless services; our data suggests that quality improvement leaders and researchers using HOMES to assess housing outcomes should consider complementing this data with EHR data elements. These findings parallel prior work (Tsai et al., <xref ref-type="bibr" rid="B23">2022</xref>) comparing estimated prevalence of homelessness across VA, which found that utilizing multiple EHR data elements can improve ascertainment of housing instability.</p>
<p>When deciding how to define housing instability using EHR data, we suggest that specific analytic goals and the underlying prevalence of housing instability be taken into consideration. Analyses examining cohorts with low prevalence of housing instability, as we had here, may demand high specificity to avoid large numbers of false positives. Specificity can be improved by requiring multiple data elements to show evidence of housing instability or by favoring more specific data elements. When high sensitivity is more desirable, using NLP or the union of multiple data elements may be more effective. Attention should also be given to missing data, as EHR data depends on patients presenting for care. Patients experiencing housing instability may use care more frequently, leading to an imbalance in the degree of observation for stably and unstably housed patients. To avoid biased results, longitudinal analyses of housing instability using EHR data should consider utilizing methods for adjusting for missing data and irregular observations (Lin et al., <xref ref-type="bibr" rid="B13">2004</xref>; Pullenayegum and Lim, <xref ref-type="bibr" rid="B21">2016</xref>; Pullenayegum and Scharfstein, <xref ref-type="bibr" rid="B22">2022</xref>).</p>
<p>This work has limitations. First, we performed these exploratory analyses on a small sample and thus our statistical analyses had low power. Regardless, the detailed patient-reported housing history we obtained over a 2-year period in patients with homeless experiences is a valuable observational dataset and our findings will inform future work. As with any retrospective analyses using patient-reported data, there is a possibility of recall or recruitment bias in our sample. Interviewed patients differed slightly in terms of race/ethnicity (i.e., interviewed patients were more likely to be African-American than the rest of the cohort and less likely to be Hispanic/Latino). They had similar distributions of psychiatric and substance use diagnoses, although the reported proportions only represent patients receiving clinical services related to these conditions and may not be reliable due to the inaccuracy of ICD-10 coding. To check for possible differential housing instability, we compared the EHR documentation of housing instability between interviewed and non-interviewed patients and found the two groups to be similar in terms of the frequency of documented housing instability, offering some assurance against recruitment bias; however, such bias remains a possibility. Second, we treated each indicator of housing instability as dichotomous. However, accuracy may be improved by factoring in information such as the number of notes processed by the NLP during a single encounter or different levels of structured data (e.g., ICD-10 codes indicating risk of homelessness vs. literal homelessness). Third, we examined a cohort of VA patients from one geographic area enrolled in a particular housing program. The observed patterns here of housing instability and EHR documentation may not generalize to other cohorts of Veterans or to populations outside of the VA, who demonstrate different demographic characteristics and documentation patterns. 
However, documentation of housing and other SDoH is common in clinical texts, and ICD-10 codes are widely used across healthcare systems. We demonstrated here that ReHouSED could be tailored for a new cohort and analysis task, and other work has demonstrated the feasibility of customizing NLP systems developed in VA to be applied in other settings (Chapman et al., <xref ref-type="bibr" rid="B3">2022</xref>). Additionally, this analysis was performed using data from the VA&#x00027;s legacy EHR, VISTA, which is planned to be replaced by Cerner. Future work should compare these findings with data in Cerner to ensure continuing data quality and accuracy.</p>
</sec>
<sec id="s5">
<title>5. Conclusions</title>
<p>Longitudinal housing status is an important outcome for patients who have experienced homelessness. For a sample of 61 homeless-experienced VA patients enrolled in a case management program, we found that housing status was documented longitudinally in the EHR using several structured and unstructured data elements. Using NLP to extract information from clinical notes can improve sensitivity for assessing housing outcomes, while incorporating multiple EHR indicators of housing instability achieves higher specificity compared to single indicators. Future work could customize ReHouSED for processing clinical texts within and outside VA for distinct patient cohorts, augmented by other EHR elements. Similar approaches could also be employed to evaluate other SDoH variables longitudinally using NLP.</p>
</sec>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The datasets presented in this article are not readily available because, due to the sensitive and protected nature of these data, the authors are unable to make them available to the public. Requests to access the datasets should be directed to <email>alec.chapman&#x00040;hsc.utah.edu</email>.</p>
</sec>
<sec sec-type="ethics-statement" id="s7">
<title>Ethics statement</title>
<p>The studies involving human participants were reviewed and approved by VA Central Institutional Review Board, U.S. Department of Veterans Affairs. Written informed consent for participation was not required for this study in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>AC contributed to conceptualization, study design, NLP system development, data curation, data analysis, system evaluation, and manuscript preparation. KCo and SG contributed to conceptualization, study design, data curation, system evaluation, and manuscript preparation. SC, TP, and DA contributed to conceptualization, study design, data curation, primary data collection, and manuscript preparation. NJ contributed to conceptualization, study design, data analysis, and manuscript preparation. KCl and JT contributed to data curation and manuscript preparation. RN and AM contributed to conceptualization, study design, NLP system development, data curation, and manuscript preparation. EF contributed to conceptualization, study design, and manuscript preparation. All authors contributed to the article and approved the submitted version.</p>
</sec>
</body>
<back>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>This study was supported by QUERI-VISN (Quality Enhancement Research Initiative-Veterans Integrated Services Networks) Partnered Implementation Initiative (PII) 21-285 (Multiple Principal Investigators: Gabrielian, Cordasco, Finley).</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s11">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/frai.2023.1187501/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/frai.2023.1187501/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Blow</surname> <given-names>F. C.</given-names></name> <name><surname>McCarthy</surname> <given-names>J. F.</given-names></name> <name><surname>Valenstein</surname> <given-names>M.</given-names></name> <name><surname>Austin</surname> <given-names>K.</given-names></name> <name><surname>Gillon</surname> <given-names>L.</given-names></name></person-group> (<year>2004</year>). <source>Care for Veterans with Psychosis in the Veterans Health Administration, FY04, 6th Annual National Psychosis Registry Report</source>.</citation>
</ref>
<ref id="B2">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Botsis</surname> <given-names>T.</given-names></name> <name><surname>Hartvigsen</surname> <given-names>G.</given-names></name> <name><surname>Chen</surname> <given-names>F.</given-names></name> <name><surname>Weng</surname> <given-names>C.</given-names></name></person-group> (<year>2010</year>). <article-title>Secondary Use of EHR: Data Quality Issues and Informatics Opportunities</article-title>. <source>AMIA Jt. Summits Transl. Sci. Proc</source>. <volume>2010</volume>, <fpage>1</fpage>&#x02013;<lpage>5</lpage>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3041534/">https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3041534/</ext-link> (accessed May 12, 2023).<pub-id pub-id-type="pmid">21347133</pub-id></citation></ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chapman</surname> <given-names>A. B.</given-names></name> <name><surname>Peterson</surname> <given-names>K. S.</given-names></name> <name><surname>Rutter</surname> <given-names>E.</given-names></name> <name><surname>Nevers</surname> <given-names>M.</given-names></name> <name><surname>Zhang</surname> <given-names>M.</given-names></name> <name><surname>Ying</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Development and evaluation of an interoperable natural language processing system for identifying pneumonia across clinical settings of care and institutions</article-title>. <source>JAMIA Open</source> <volume>5</volume>, <fpage>114</fpage>. <pub-id pub-id-type="doi">10.1093/JAMIAOPEN/OOAC114</pub-id><pub-id pub-id-type="pmid">36601365</pub-id></citation></ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chapman</surname> <given-names>A. B.</given-names></name> <name><surname>Jones</surname> <given-names>A.</given-names></name> <name><surname>Kelley</surname> <given-names>A. T.</given-names></name> <name><surname>Jones</surname> <given-names>B.</given-names></name> <name><surname>Gawron</surname> <given-names>L.</given-names></name> <name><surname>Montgomery</surname> <given-names>A. E.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>ReHouSED: a novel measurement of veteran housing stability using natural language processing</article-title>. <source>J. Biomed. Inform</source>. <volume>122</volume>, <fpage>103903</fpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103903</pub-id><pub-id pub-id-type="pmid">34474188</pub-id></citation></ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Conway</surname> <given-names>M.</given-names></name> <name><surname>Keyhani</surname> <given-names>S.</given-names></name> <name><surname>Christensen</surname> <given-names>L.</given-names></name> <name><surname>South</surname> <given-names>B. R.</given-names></name> <name><surname>Vali</surname> <given-names>M.</given-names></name> <name><surname>Walter</surname> <given-names>L. C.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Moonstone: a novel natural language processing system for inferring social risk from clinical narratives</article-title>. <source>J. Biomed. Semant</source>. <volume>10</volume>, <fpage>198</fpage>. <pub-id pub-id-type="doi">10.1186/s13326-019-0198-0</pub-id><pub-id pub-id-type="pmid">30975223</pub-id></citation></ref>
<ref id="B6">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Eyre</surname> <given-names>H.</given-names></name> <name><surname>Chapman</surname> <given-names>A. B.</given-names></name> <name><surname>Peterson</surname> <given-names>K. S</given-names></name></person-group>. <article-title>Launching into clinical space with medspaCy: a new clinical text processing toolkit in Python</article-title>. <source>AMIA Annu. Symp. Proc.</source> (<year>2021</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2106.07799">https://arxiv.org/abs/2106.07799</ext-link><pub-id pub-id-type="pmid">35308962</pub-id></citation></ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gabrielian</surname> <given-names>S.</given-names></name> <name><surname>Finley</surname> <given-names>E. P.</given-names></name> <name><surname>Ganz</surname> <given-names>D. A.</given-names></name> <name><surname>Barnard</surname> <given-names>J. M.</given-names></name> <name><surname>Jackson</surname> <given-names>N. J.</given-names></name> <name><surname>Montgomery</surname> <given-names>A. E.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Comparing two implementation strategies for implementing and sustaining a case management practice serving homeless-experienced veterans: a protocol for a type 3 hybrid cluster-randomized trial</article-title>. <source>Implement. Sci</source>. <volume>17</volume>, <fpage>1</fpage>&#x02013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1186/S13012-022-01236-1/TABLES/5</pub-id><pub-id pub-id-type="pmid">36192785</pub-id></citation></ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Glicksberg</surname> <given-names>B. S.</given-names></name> <name><surname>Johnson</surname> <given-names>K. W.</given-names></name> <name><surname>Dudley</surname> <given-names>J. T.</given-names></name></person-group> (<year>2018</year>). <article-title>The next generation of precision medicine: observational studies, electronic health records, biobanks and continuous monitoring</article-title>. <source>Hum. Mol. Genet</source>. <volume>27</volume>, <fpage>R56</fpage>&#x02013;<lpage>R62</lpage>. <pub-id pub-id-type="doi">10.1093/hmg/ddy114</pub-id><pub-id pub-id-type="pmid">29659828</pub-id></citation></ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gundlapalli</surname> <given-names>A. V.</given-names></name> <name><surname>Carter</surname> <given-names>M. E.</given-names></name> <name><surname>Palmer</surname> <given-names>M.</given-names></name> <name><surname>Ginter</surname> <given-names>T.</given-names></name> <name><surname>Redd</surname> <given-names>A.</given-names></name> <name><surname>Pickard</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Using natural language processing on the free text of clinical documents to screen for evidence of homelessness among US veterans</article-title>. <source>AMIA Annu. Symp. Proc</source>. <volume>2013</volume>, <fpage>537</fpage>&#x02013;<lpage>546</lpage>.<pub-id pub-id-type="pmid">24551356</pub-id></citation></ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gundlapalli</surname> <given-names>A. V.</given-names></name> <name><surname>Fargo</surname> <given-names>J. D.</given-names></name> <name><surname>Metraux</surname> <given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>Military misconduct and homelessness among US veterans separated from active duty, 2001&#x02013;2012</article-title>. <source>JAMA&#x02014;J. Am. Med. Assoc</source>. <volume>314</volume>, <fpage>832</fpage>&#x02013;<lpage>834</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2015.8207</pub-id><pub-id pub-id-type="pmid">26305655</pub-id></citation></ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hatef</surname> <given-names>E.</given-names></name> <name><surname>Rouhizadeh</surname> <given-names>M.</given-names></name> <name><surname>Nau</surname> <given-names>C.</given-names></name> <name><surname>Xie</surname> <given-names>F.</given-names></name> <name><surname>Rouillard</surname> <given-names>C.</given-names></name> <name><surname>Abu-Nasser</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Development and assessment of a natural language processing model to identify residential instability in electronic health records&#x00027; unstructured data: a comparison of 3 integrated healthcare delivery systems</article-title>. <source>JAMIA Open</source> <volume>5</volume>, <fpage>1</fpage>&#x02013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1093/jamiaopen/ooac006</pub-id><pub-id pub-id-type="pmid">35224458</pub-id></citation></ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Herman</surname> <given-names>D.</given-names></name> <name><surname>Opler</surname> <given-names>L.</given-names></name> <name><surname>Felix</surname> <given-names>A.</given-names></name> <name><surname>Valencia</surname> <given-names>E.</given-names></name> <name><surname>Wyatt</surname> <given-names>R. J.</given-names></name> <name><surname>Susser</surname> <given-names>E. A.</given-names></name> <etal/></person-group>. (<year>2000</year>). <article-title>Critical time intervention with mentally ill homeless men: impact on psychiatric symptoms</article-title>. <source>J. Nerv. Ment. Dis</source>. <volume>188</volume>, <fpage>135</fpage>&#x02013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1097/00005053-200003000-00002</pub-id><pub-id pub-id-type="pmid">10749277</pub-id></citation></ref>
<ref id="B13">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>H.</given-names></name> <name><surname>Scharfstein</surname> <given-names>D. O.</given-names></name> <name><surname>Rosenheck</surname> <given-names>R. A.</given-names></name></person-group> (<year>2004</year>). <article-title>Analysis of longitudinal data with irregular, outcome-dependent follow-up</article-title>. <source>J. Royal. Stat. Soc. Series B</source>. <volume>66</volume>, <fpage>791</fpage>&#x02013;<lpage>813</lpage>. <ext-link ext-link-type="uri" xlink:href="https://www.jstor.org/stable/3647506">https://www.jstor.org/stable/3647506</ext-link> (accessed May 12, 2023).<pub-id pub-id-type="pmid">26237289</pub-id></citation></ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lokku</surname> <given-names>A.</given-names></name> <name><surname>Birken</surname> <given-names>C. S.</given-names></name> <name><surname>Maguire</surname> <given-names>J. L.</given-names></name> <name><surname>Pullenayegum</surname> <given-names>E. M.</given-names></name></person-group> (<year>2021</year>). <article-title>Summarizing the extent of visit irregularity in longitudinal data</article-title>. <source>Int. J. Biostatist</source>. <volume>3</volume>, <fpage>1</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1515/ijb-2020-0144</pub-id><pub-id pub-id-type="pmid">32471357</pub-id></citation></ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lybarger</surname> <given-names>K.</given-names></name> <name><surname>Yetisgen</surname> <given-names>M.</given-names></name> <name><surname>Uzuner</surname> <given-names>&#x000D6;.</given-names></name></person-group> (<year>2023</year>). <article-title>The 2022 n2c2/UW shared task on extracting social determinants of health</article-title>. <source>J. Am. Med. Informat. Assoc</source>. <volume>2023</volume>, <fpage>ocad012</fpage>. <pub-id pub-id-type="doi">10.1093/jamia/ocad012</pub-id><pub-id pub-id-type="pmid">36795066</pub-id></citation></ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mendelson</surname> <given-names>T.</given-names></name> <name><surname>Turner</surname> <given-names>A. K.</given-names></name> <name><surname>Tandon</surname> <given-names>S. D.</given-names></name></person-group> (<year>2010</year>). <article-title>Measuring homelessness and residential stability: the residential time-line follow-back inventory</article-title>. <source>J. Commun. Psychol</source>. <volume>38</volume>, <fpage>607</fpage>&#x02013;<lpage>621</lpage>. <pub-id pub-id-type="doi">10.1002/jcop</pub-id><pub-id pub-id-type="pmid">33685434</pub-id></citation></ref>
<ref id="B17">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Montgomery</surname> <given-names>A. E.</given-names></name> <name><surname>Fargo</surname> <given-names>J. D.</given-names></name> <name><surname>Byrne</surname> <given-names>T. H.</given-names></name> <name><surname>Kane</surname> <given-names>V.</given-names></name> <name><surname>Culhane</surname> <given-names>D. P</given-names></name></person-group>. <article-title>Universal Screening for Homelessness and Risk for Homelessness in the Veterans Health Administration</article-title>. (<year>2022</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.ajph.org">http://www.ajph.org</ext-link> (accessed December 11, 2022).<pub-id pub-id-type="pmid">24148032</pub-id></citation></ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nelson</surname> <given-names>R. E.</given-names></name> <name><surname>Suo</surname> <given-names>Y.</given-names></name> <name><surname>Pettey</surname> <given-names>W.</given-names></name> <name><surname>Vanneman</surname> <given-names>M.</given-names></name> <name><surname>Montgomery</surname> <given-names>A. E.</given-names></name> <name><surname>Byrne</surname> <given-names>T.</given-names></name></person-group> (<year>2018</year>). <article-title>Costs associated with health care services accessed through VA and in the community through medicare for veterans experiencing homelessness</article-title>. <source>Health Serv. Res</source>. <volume>53</volume>, <fpage>5352</fpage>&#x02013;<lpage>5374</lpage>. <pub-id pub-id-type="doi">10.1111/1475-6773.13054</pub-id><pub-id pub-id-type="pmid">30246368</pub-id></citation></ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><collab>World Health Organization</collab></person-group> (<year>2004</year>). <source>ICD-10 : International Statistical Classification of Diseases and Related Health Problems : Tenth Revision</source>.</citation>
</ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peterson</surname> <given-names>R.</given-names></name> <name><surname>Gundlapalli</surname> <given-names>A.</given-names></name></person-group> (<year>2015</year>). <article-title>Identifying homelessness among veterans using VA administrative data: opportunities to expand detection criteria</article-title>. <source>PLoS ONE</source>. <volume>10</volume>, <fpage>1</fpage>&#x02013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0132664</pub-id><pub-id pub-id-type="pmid">26172386</pub-id></citation></ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pullenayegum</surname> <given-names>E. M.</given-names></name> <name><surname>Lim</surname> <given-names>L. S. H.</given-names></name></person-group> (<year>2016</year>). <article-title>Longitudinal data subject to irregular observation: a review of methods with a focus on visit processes, assumptions, and study design</article-title>. <source>Stat. Methods Med. Res</source>. <volume>25</volume>, <fpage>2992</fpage>&#x02013;<lpage>3014</lpage>. <pub-id pub-id-type="doi">10.1177/0962280214536537</pub-id><pub-id pub-id-type="pmid">24855119</pub-id></citation></ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pullenayegum</surname> <given-names>E. M.</given-names></name> <name><surname>Scharfstein</surname> <given-names>D. O.</given-names></name></person-group> (<year>2022</year>). <article-title>Randomized trials with repeatedly measured outcomes: handling irregular and potentially informative assessment times</article-title>. <source>Epidemiol. Rev</source>. <volume>44</volume>, <fpage>121</fpage>&#x02013;<lpage>137</lpage>. <pub-id pub-id-type="doi">10.1093/epirev/mxac010</pub-id><pub-id pub-id-type="pmid">36259969</pub-id></citation></ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tsai</surname> <given-names>J.</given-names></name> <name><surname>Szymkowiak</surname> <given-names>D.</given-names></name> <name><surname>Jutkowitz</surname> <given-names>E.</given-names></name></person-group> (<year>2022</year>). <article-title>Developing an operational definition of housing instability and homelessness in Veterans Health Administration&#x00027;s medical records</article-title>. <source>PLoS ONE</source>. <volume>17</volume>, <fpage>e0279973</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0279973</pub-id><pub-id pub-id-type="pmid">36584201</pub-id></citation></ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Ruan</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>P.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name></person-group> (<year>2016</year>). <article-title>Comparison of three information sources for smoking information in electronic health records</article-title>. <source>Cancer Inform</source>. <volume>15</volume>, <fpage>237</fpage>&#x02013;<lpage>242</lpage>. <pub-id pub-id-type="doi">10.4137/CIN.S40604</pub-id><pub-id pub-id-type="pmid">27980387</pub-id></citation></ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wells</surname> <given-names>B. J.</given-names></name> <name><surname>Nowacki</surname> <given-names>A. S.</given-names></name> <name><surname>Chagin</surname> <given-names>K.</given-names></name> <name><surname>Kattan</surname> <given-names>M. W.</given-names></name></person-group> (<year>2013</year>). <article-title>Strategies for handling missing data in electronic health record derived data</article-title>. <source>eGEMs Gen. Evid. Methods Imp. Patient Outcomes</source>. <volume>1</volume>, <fpage>7</fpage>. <pub-id pub-id-type="doi">10.13063/2327-9214.1035</pub-id><pub-id pub-id-type="pmid">25848578</pub-id></citation></ref>
</ref-list> 
</back>
</article>
