<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.0 20120330//EN" "JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">JDS</journal-id>
<journal-title-group><journal-title>Journal of Data Science</journal-title></journal-title-group>
<issn pub-type="epub">1683-8602</issn><issn pub-type="ppub">1680-743X</issn><issn-l>1680-743X</issn-l>
<publisher>
<publisher-name>School of Statistics, Renmin University of China</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">JDS1116</article-id>
<article-id pub-id-type="doi">10.6339/23-JDS1116</article-id>
<article-categories><subj-group subj-group-type="heading">
<subject>Data Science in Action</subject></subj-group></article-categories>
<title-group>
<article-title>Race-Specific Risk Factors for Homeownership Disparity in the Continental United States</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Richardson</surname><given-names>Rachel E.</given-names></name><email xlink:href="mailto:rachel.richardson@pnnl.gov">rachel.richardson@pnnl.gov</email><xref ref-type="aff" rid="j_jds1116_aff_001">1</xref><xref ref-type="corresp" rid="cor1">∗</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Leach</surname><given-names>Damon T.</given-names></name><xref ref-type="aff" rid="j_jds1116_aff_001">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Winans</surname><given-names>Natalie M.</given-names></name><xref ref-type="aff" rid="j_jds1116_aff_001">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Degnan</surname><given-names>David J.</given-names></name><xref ref-type="aff" rid="j_jds1116_aff_001">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Prymolenna</surname><given-names>Anastasiya V.</given-names></name><xref ref-type="aff" rid="j_jds1116_aff_002">2</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Bramer</surname><given-names>Lisa M.</given-names></name><xref ref-type="aff" rid="j_jds1116_aff_001">1</xref>
</contrib>
<aff id="j_jds1116_aff_001"><label>1</label><institution>Biological Sciences Division, Pacific Northwest National Laboratory</institution>, Richland, WA, 99354, <country>USA</country></aff>
<aff id="j_jds1116_aff_002"><label>2</label><institution>Environmental Molecular Sciences Division, Pacific Northwest National Laboratory</institution>, Richland, WA, 99354, <country>USA</country></aff>
</contrib-group>
<author-notes>
<corresp id="cor1"><label>∗</label>Corresponding author. Email: <ext-link ext-link-type="uri" xlink:href="mailto:rachel.richardson@pnnl.gov">rachel.richardson@pnnl.gov</ext-link>.</corresp>
</author-notes>
<pub-date pub-type="ppub"><year>2024</year></pub-date><pub-date pub-type="epub"><day>13</day><month>12</month><year>2023</year></pub-date><volume>22</volume><issue>4</issue><fpage>591</fpage><lpage>604</lpage><supplementary-material id="S1" content-type="document" xlink:href="jds1116_s001.pdf" mimetype="application" mime-subtype="pdf">
<caption>
<title>Supplementary Material</title>
<p>Open-source code, additional visualizations and tables, as well as original datasets are available in a public GitHub repository:</p>
<p><uri>https://github.com/PNNL-CompBio/HomeownershipDisparity_2015_2019</uri></p>
<p><bold>Tables</bold> 
<list>
<list-item id="j_jds1116_li_001">
<label>•</label>
<p>Table 1: Descriptions of variables</p>
</list-item>
<list-item id="j_jds1116_li_002">
<label>•</label>
<p>Table 2: Division county percentages per Race dataset</p>
</list-item>
<list-item id="j_jds1116_li_003">
<label>•</label>
<p>Table 3: Number of counties in each dataset</p>
</list-item>
</list> 
<bold>Plots</bold> 
<list>
<list-item id="j_jds1116_li_004">
<label>•</label>
<p>Figure 1: Dataset timeline</p>
</list-item>
<list-item id="j_jds1116_li_005">
<label>•</label>
<p>Figure 2: Important variables for White models with and without outliers</p>
</list-item>
<list-item id="j_jds1116_li_006">
<label>•</label>
<p>Figure 3: Correlation between predictor variables</p>
</list-item>
<list-item id="j_jds1116_li_007">
<label>•</label>
<p>Figure 4: Model performance on 10% holdout data</p>
</list-item>
</list>
</p>
</caption>
</supplementary-material><history><date date-type="received"><day>10</day><month>12</month><year>2022</year></date><date date-type="accepted"><day>29</day><month>10</month><year>2023</year></date></history>
<permissions><copyright-statement>2024 The Author(s). Published by the School of Statistics and the Center for Applied Statistics, Renmin University of China.</copyright-statement><copyright-year>2024</copyright-year>
<license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
<license-p>Open access article under the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">CC BY</ext-link> license.</license-p></license></permissions>
<abstract>
<p>The United States has a racial homeownership gap due to a legacy of historic inequality and discriminatory policies, but factors that contribute to the racial disparity in homeownership rates between White Americans and people of color have not been fully characterized. In order to alleviate this issue, policymakers need a better understanding of how risk factors affect the homeownership rates of racial and ethnic groups differently. In this study, data from several publicly available surveys, including the American Community Survey and United States Census, were leveraged in combination with statistical learning models to investigate potential factors related to homeownership rates across racial and ethnic categories, with a focus on how risk factors vary by race or ethnicity. Our models indicated that job availability for specific demographics and specific regions of the United States were factors that affect homeownership rates in Black, Hispanic, and Asian populations in different ways. Based on the results of this study, it is recommended that policymakers promote strategies to increase access to jobs for people of color (POC), such as vocational training and programs to reduce implicit bias in hiring practices. These interventions could ultimately increase homeownership rates for POC and be a step toward reducing the racial wealth gap.</p>
</abstract>
<kwd-group>
<label>Keywords</label>
<kwd>census</kwd>
<kwd>economics</kwd>
<kwd>random forest</kwd>
<kwd>survey</kwd>
</kwd-group>
<funding-group><award-group><funding-source xlink:href="https://doi.org/10.13039/100000015">U.S. Department of Energy</funding-source><award-id>DE-AC05-76RL01830</award-id></award-group><funding-statement>PNNL is a multi-program national laboratory operated for the U.S. Department of Energy (DOE) by Battelle Memorial Institute under Contract No. DE-AC05-76RL01830. </funding-statement></funding-group>
</article-meta>
</front>
<back>
<ref-list id="j_jds1116_reflist_001">
<title>References</title>
<ref id="j_jds1116_ref_001">
<mixed-citation publication-type="journal"> <string-name><surname>Biau</surname> <given-names>G</given-names></string-name>, <string-name><surname>Scornet</surname> <given-names>E</given-names></string-name> (<year>2016</year>). <article-title>A random forest guided tour</article-title>. <source><italic>TEST</italic></source>, <volume>25</volume>(<issue>2</issue>): <fpage>197</fpage>–<lpage>227</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1007/s11749-016-0481-7" xlink:type="simple">https://doi.org/10.1007/s11749-016-0481-7</ext-link></mixed-citation>
</ref>
<ref id="j_jds1116_ref_002">
<mixed-citation publication-type="journal"> <string-name><surname>Breiman</surname> <given-names>L</given-names></string-name> (<year>2001</year>). <article-title>Random forests</article-title>. <source><italic>Machine Learning</italic></source>, <volume>45</volume>(<issue>1</issue>): <fpage>5</fpage>–<lpage>32</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1023/A:1010933404324" xlink:type="simple">https://doi.org/10.1023/A:1010933404324</ext-link></mixed-citation>
</ref>
<ref id="j_jds1116_ref_003">
<mixed-citation publication-type="book"> <string-name><surname>Choi</surname> <given-names>JH</given-names></string-name>, <string-name><surname>McCargo</surname> <given-names>A</given-names></string-name>, <string-name><surname>Neal</surname> <given-names>M</given-names></string-name>, <string-name><surname>Goodman</surname> <given-names>L</given-names></string-name>, <string-name><surname>Young</surname> <given-names>C</given-names></string-name> (<year>2019</year>). <source><italic>Explaining the Black-White Homeownership Gap</italic></source>, volume <volume>25</volume>. <publisher-name>Urban Institute</publisher-name>, <publisher-loc>Washington, DC</publisher-loc>. <comment>Retrieved: March 25, 2021</comment>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_004">
<mixed-citation publication-type="other"> Department of Defense (2014). Per diem rates by location. Retrieved from: <uri>https://www.travel.dod.mil/</uri>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_005">
<mixed-citation publication-type="journal"> <string-name><surname>Gabriel</surname> <given-names>SA</given-names></string-name>, <string-name><surname>Rosenthal</surname> <given-names>SS</given-names></string-name> (<year>2005</year>). <article-title>Homeownership in the 1980s and 1990s: aggregate trends and racial gaps</article-title>. <source><italic>Journal of Urban Economics</italic></source>, <volume>57</volume>(<issue>1</issue>): <fpage>101</fpage>–<lpage>127</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1016/j.jue.2004.09.001" xlink:type="simple">https://doi.org/10.1016/j.jue.2004.09.001</ext-link></mixed-citation>
</ref>
<ref id="j_jds1116_ref_006">
<mixed-citation publication-type="other"> <string-name><surname>Hafen</surname> <given-names>R</given-names></string-name>, <string-name><surname>Schloerke</surname> <given-names>B</given-names></string-name> (<year>2021</year>). <italic>trelliscopejs: Create Interactive Trelliscope Displays</italic>. R package version 0.2.6.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_007">
<mixed-citation publication-type="other"> <string-name><surname>Henry</surname> <given-names>L</given-names></string-name>, <string-name><surname>Wickham</surname> <given-names>H</given-names></string-name> (<year>2022</year>). <italic>purrr: Functional Programming Tools</italic>. R package version 0.3.5.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_008">
<mixed-citation publication-type="journal"> <string-name><surname>Hilber</surname> <given-names>CA</given-names></string-name>, <string-name><surname>Liu</surname> <given-names>Y</given-names></string-name> (<year>2008</year>). <article-title>Explaining the Black–White homeownership gap: The role of own wealth, parental externalities and locational preferences</article-title>. <source><italic>Journal of Housing Economics</italic></source>, <volume>17</volume>(<issue>2</issue>): <fpage>152</fpage>–<lpage>174</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1016/j.jhe.2008.02.001" xlink:type="simple">https://doi.org/10.1016/j.jhe.2008.02.001</ext-link></mixed-citation>
</ref>
<ref id="j_jds1116_ref_009">
<mixed-citation publication-type="journal"> <string-name><surname>Kuebler</surname> <given-names>M</given-names></string-name>, <string-name><surname>Rugh</surname> <given-names>JS</given-names></string-name> (<year>2013</year>). <article-title>New evidence on racial and ethnic disparities in homeownership in the United States from 2001 to 2010</article-title>. <source><italic>Social Science Research</italic></source>, <volume>42</volume>(<issue>5</issue>): <fpage>1357</fpage>–<lpage>1374</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1016/j.ssresearch.2013.06.004" xlink:type="simple">https://doi.org/10.1016/j.ssresearch.2013.06.004</ext-link></mixed-citation>
</ref>
<ref id="j_jds1116_ref_010">
<mixed-citation publication-type="journal"> <string-name><surname>Liaw</surname> <given-names>A</given-names></string-name>, <string-name><surname>Wiener</surname> <given-names>M</given-names></string-name> (<year>2013</year>). <article-title>Classification and regression by randomForest</article-title>. <source><italic>R News</italic></source>, <volume>2</volume>(<issue>3</issue>): <fpage>18</fpage>–<lpage>22</lpage>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_011">
<mixed-citation publication-type="book"> <string-name><surname>McCargo</surname> <given-names>A</given-names></string-name>, <string-name><surname>Choi</surname> <given-names>JH</given-names></string-name>, <string-name><surname>Golding</surname> <given-names>E</given-names></string-name> (<year>2019</year>). <source><italic>Building Black Homeownership Bridges: A Five-Point Framework for Reducing the Racial Homeownership Gap</italic></source>. <publisher-name>Urban Institute</publisher-name>, <publisher-loc>Washington, DC</publisher-loc>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_012">
<mixed-citation publication-type="journal"> <string-name><surname>Perez</surname> <given-names>AD</given-names></string-name>, <string-name><surname>Hirschman</surname> <given-names>C</given-names></string-name> (<year>2009</year>). <article-title>The changing racial and ethnic composition of the US population: Emerging American identities</article-title>. <source><italic>Population and Development Review</italic></source>, <volume>35</volume>(<issue>1</issue>): <fpage>1</fpage>–<lpage>51</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1111/j.1728-4457.2009.00260.x" xlink:type="simple">https://doi.org/10.1111/j.1728-4457.2009.00260.x</ext-link></mixed-citation>
</ref>
<ref id="j_jds1116_ref_013">
<mixed-citation publication-type="book"> <collab>R Core Team</collab> (<year>2020</year>). <source><italic>R: A Language and Environment for Statistical Computing</italic></source>. <publisher-name>R Foundation for Statistical Computing</publisher-name>, <publisher-loc>Vienna, Austria</publisher-loc>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_014">
<mixed-citation publication-type="other"> <string-name><surname>Ray</surname> <given-names>R</given-names></string-name>, <string-name><surname>Perry</surname> <given-names>AM</given-names></string-name>, <string-name><surname>Harshbarger</surname> <given-names>D</given-names></string-name>, <string-name><surname>Elizondo</surname> <given-names>S</given-names></string-name>, <string-name><surname>Gibbons</surname> <given-names>A</given-names></string-name> (<year>2021</year>). <italic>Homeownership, racial segregation, and policy solutions to racial wealth equity</italic>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_015">
<mixed-citation publication-type="journal"> <string-name><surname>Spearman</surname> <given-names>C</given-names></string-name> (<year>1987</year>). <article-title>The proof and measurement of association between two things</article-title>. <source><italic>The American Journal of Psychology</italic></source>, <volume>100</volume>(<issue>3/4</issue>): <fpage>441</fpage>–<lpage>471</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.2307/1422689" xlink:type="simple">https://doi.org/10.2307/1422689</ext-link></mixed-citation>
</ref>
<ref id="j_jds1116_ref_016">
<mixed-citation publication-type="other"> <string-name><surname>Strochak</surname> <given-names>S</given-names></string-name>, <string-name><surname>Ueyama</surname> <given-names>K</given-names></string-name>, <string-name><surname>Williams</surname> <given-names>A</given-names></string-name> (<year>2022</year>). <italic>urbnmapr: State and county shapefiles in sf and tibble format</italic>. R package version 0.0.0.9002.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_017">
<mixed-citation publication-type="journal"> <string-name><surname>Turner</surname> <given-names>TM</given-names></string-name>, <string-name><surname>Luea</surname> <given-names>H</given-names></string-name> (<year>2009</year>). <article-title>Homeownership, wealth accumulation and income status</article-title>. <source><italic>Journal of Housing Economics</italic></source>, <volume>18</volume>(<issue>2</issue>): <fpage>104</fpage>–<lpage>114</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1016/j.jhe.2009.04.005" xlink:type="simple">https://doi.org/10.1016/j.jhe.2009.04.005</ext-link></mixed-citation>
</ref>
<ref id="j_jds1116_ref_018">
<mixed-citation publication-type="other"> Urban Institute (2020). Household conditions by geographical school district. Retrieved from: <uri>https://datacatalog.urban.org/dataset/household-conditions-geographic-school-district</uri>. Data originally sourced from NHGIS, developed at the Urban Institute, and made available under the ODC-BY 1.0 Attribution License.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_019">
<mixed-citation publication-type="other"> Urban Institute (2021a). Homeowner assistance fund county-level targeting data. Retrieved from: <uri>https://datacatalog.urban.org/dataset/homeowner-assistance-fund-county-l</uri>. Data originally sourced from NHGIS, developed at the Urban Institute, and made available under the ODC-BY 1.0 Attribution License.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_020">
<mixed-citation publication-type="other"> Urban Institute (2021b). Unequal commute data. Retrieved from: <uri>https://datacatalog.urban.org/dataset/unequal-commute-data</uri>. Data originally sourced from US Census Bureau’s 2017 LEHD Origin-Destination Employment Statistics, 2014–18 American Community Survey five-year estimates, Transitland repository, OpenStreetMap, and INRIX’s 2019 Global Traffic Scorecard, developed at the Urban Institute, and made available under the ODC-BY 1.0 Attribution License.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_021">
<mixed-citation publication-type="other"> Urban Institute (2022). Longitudinal Employer-Household Dynamics Origin-Destination Employment Statistics (LODES) summary files – census tract level. Retrieved from: <ext-link ext-link-type="uri" xlink:href="https://datacatalog.urban.org/dataset/longitudinal-employer-household-dynamics-origin-destination-employment-statistics-lodes">https://datacatalog.urban.org/dataset/longitudinal-employer-household-dynamics-origin-destination-employment-statistics-lodes</ext-link>. Data originally sourced from the US Census Bureau, developed at the Urban Institute, and made available under the ODC-BY 1.0 Attribution License.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_022">
<mixed-citation publication-type="other"> US Census Bureau (2019). Travel time to work in the United States. Retrieved from: <uri>https://www.census.gov/content/dam/Census/library/publications/2021/acs/acs-47.pdf</uri>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_023">
<mixed-citation publication-type="other"> US Census Bureau (2013). Census bureau regions and divisions with state FIPS codes. Retrieved from: <uri>https://www2.census.gov/geo/pdfs/maps-data/maps/reference/</uri>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_024">
<mixed-citation publication-type="other"> US Census Bureau (2019a). Annual county resident population estimates by age, sex, race, and Hispanic origin: April 1, 2010 to July 1, 2019. Retrieved from: <uri>https://www.census.gov/data/tables/time-series/demo/popest/2010s-counties-detail.html</uri>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_025">
<mixed-citation publication-type="other"> US Census Bureau (2019b). Annual resident population estimates, estimated components of resident population change, and rates of the components of resident population change for states and counties: April 1, 2010 to July 1, 2019. Retrieved from: <uri>https://www.census.gov/data/tables/time-series/demo/popest/2010s-counties-total.html</uri>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_026">
<mixed-citation publication-type="other"> US Census Bureau (2019c). Building permits survey. Retrieved from: <uri>https://www.census.gov/construction/bps/</uri>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_027">
<mixed-citation publication-type="other"> US Census Bureau (2020a). Average household size and population density. Retrieved from: <ext-link ext-link-type="uri" xlink:href="https://covid19.census.gov/datasets/USCensus::average-household-size-and-population-density-county">https://covid19.census.gov/datasets/USCensus::average-household-size-and-population-density-county</ext-link>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_028">
<mixed-citation publication-type="other"> US Census Bureau (2020b). Highest level of educational attainment. Retrieved from: <uri>https://data.ers.usda.gov/reports.aspx?ID=17829</uri>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_029">
<mixed-citation publication-type="other"> US Census Bureau (2022). American Community Survey 1-year estimates: New England Division. Retrieved from: <uri>https://censusreporter.org/profiles/03000US1-new-england-division/</uri>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_030">
<mixed-citation publication-type="book"> <string-name><surname>Wickham</surname> <given-names>H</given-names></string-name> (<year>2016</year>). <source><italic>ggplot2: Elegant Graphics for Data Analysis</italic></source>.</mixed-citation>
</ref>
<ref id="j_jds1116_ref_031">
<mixed-citation publication-type="other"> <string-name><surname>Wickham</surname> <given-names>H</given-names></string-name>, <string-name><surname>François</surname> <given-names>R</given-names></string-name>, <string-name><surname>Henry</surname> <given-names>L</given-names></string-name>, <string-name><surname>Müller</surname> <given-names>K</given-names></string-name> (<year>2022</year>). <italic>dplyr: A Grammar of Data Manipulation</italic>. R package version 1.0.10.</mixed-citation>
</ref>
</ref-list>
</back>
</article>
