<?xml version='1.0' encoding='UTF-8'?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d1 20130915//EN" "JATS-journalpublishing1.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
  <front>
    <journal-meta id="journal-meta-653a6cf9bc6b481885747d822ed97323">
      <journal-id journal-id-type="nlm-ta">Lund University, Sweden</journal-id>
      <journal-id journal-id-type="publisher-id">Lund University, Sweden</journal-id>
      <journal-id journal-id-type="journal_submission_guidelines">https://www.tsr.international/#:~:text=Traffic%20Safety%20Research%20(TSR)%20is,Traffic%20safety%20(ICTCT)%20association.</journal-id>
      <journal-title-group>
        <journal-title>Traffic Safety Research</journal-title>
      </journal-title-group>
      <issn publication-format="print">2004-3082</issn>
    </journal-meta>
    <article-meta id="article-meta-d332e3d120a24a1cb3f94e028bc9323d">
      <article-id pub-id-type="publisher-id">e000075</article-id>
      <article-id pub-id-type="doi">10.55329/aseb7655</article-id>
      <article-categories>
        <subj-group>
          <subject>Research article</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title id="article-title-e9b0298970504fbdaba252b56f1c7f22">Applying model-based recursive partitioning to improve pedestrian exposure models to support transportation safety analyses</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="yes">
          <contrib-id contrib-id-type="orcid">0009-0008-7378-6493</contrib-id>
          <contrib-id contrib-id-type="role">Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Visualization, Writing—original draft, Writing—review &amp; editing.</contrib-id>
          <name id="n-0ee7b585d62a">
            <surname>Wiegand</surname>
            <given-names>Jakob C.</given-names>
          </name>
          <email>jakob.wiegand@psu.edu</email>
          <bio>
            <graphic xlink:href="https://typeset-prod-media-server.s3.amazonaws.com/article_uploads/b4c20676-0003-47f6-98f8-f54dc3dd1e1b/image/c284561b-d4ec-481d-9d0c-4c731d021288-ujakob_c_wiegand.png" content-type="author-image"/>
            <p>received his BS in Civil Engineering from Valparaiso University in 2022 and is currently pursuing a Ph.D. in Transportation Engineering at The Pennsylvania State University. His research interests broadly cover transportation safety, but primarily focus on safety of vulnerable roadway users – especially pedestrians. Jakob’s recent research aims to emphasize the importance of accurate exposure estimates in crash prediction modeling and equity of protections for pedestrians.</p>
          </bio>
          <xref id="x-f8ae693acee9" rid="aff-a45fa1f649b5468f9d4acfec450a9e85" ref-type="aff">1</xref>
        </contrib>
        <contrib contrib-type="author">
          <contrib-id contrib-id-type="orcid">0000-0002-0648-3360</contrib-id>
          <contrib-id contrib-id-type="role">Conceptualization, Data curation, Methodology, Supervision, Validation, Writing—review &amp; editing.</contrib-id>
          <name id="n-246f44b29d4c">
            <surname>Gayah</surname>
            <given-names>Vikash V.</given-names>
          </name>
          <bio>
            <graphic xlink:href="https://typeset-prod-media-server.s3.amazonaws.com/article_uploads/b4c20676-0003-47f6-98f8-f54dc3dd1e1b/image/9eda7b37-0a2c-4310-9daf-47da69fccbad-uvikash_v_gayah.png" content-type="author-image"/>
            <p>is a professor in the Department of Civil and Environmental Engineering at The Pennsylvania State University, where he also serves as the Interim Director of the Larson Transportation Institute. He received his B.S. and M.S. degrees from the University of Central Florida and his Ph.D. degree from the University of California, Berkeley. Dr. Gayah’s research focuses on urban mobility, traffic operations, traffic flow theory, traffic safety and non-motorized transportation. Dr. Gayah currently serves as an editorial advisory board member of Transportation Research Part C: Emerging Technologies and Accident Analysis and Prevention, an editorial board editor of Transportation Research Part B: Methodological, an associate editor for Transportation Letters and the IEEE Intelligent Transportation Systems Magazine (an international peer-reviewed journal), and a handling editor for the Transportation Research Record.</p>
          </bio>
          <xref id="x-69bd7cbd3222" rid="aff-a45fa1f649b5468f9d4acfec450a9e85" ref-type="aff">1</xref>
        </contrib>
        <contrib contrib-type="editor">
          <name id="n-dd56b8349951">
            <surname>Stamatiadis</surname>
            <given-names>Nikiforos</given-names>
          </name>
          <xref id="x-5256354ab1ba" rid="aff-957079c8bf8e4dd6b90c05748c6b636f" ref-type="aff">2</xref>
        </contrib>
        <contrib contrib-type="reviewer">
          <name id="n-f13751897c1a">
            <surname>Kiec</surname>
            <given-names>Mariusz</given-names>
          </name>
          <xref id="x-55eadbc05004" rid="a-61cb33f30796" ref-type="aff">3</xref>
        </contrib>
        <contrib contrib-type="reviewer">
          <name id="n-21c631fae7bd">
            <surname>Sewell</surname>
            <given-names>Mike</given-names>
          </name>
          <xref id="x-d6470bcf176c" rid="a-42ad91233e64" ref-type="aff">4</xref>
        </contrib>
        <aff id="aff-a45fa1f649b5468f9d4acfec450a9e85">
          <institution>The Pennsylvania State University</institution>
          <country>the United States of America</country>
        </aff>
        <aff id="aff-957079c8bf8e4dd6b90c05748c6b636f">
          <institution>University of Kentucky</institution>
          <country>the United States of America</country>
        </aff>
        <aff id="a-61cb33f30796">
          <institution>Cracow University of Technology</institution>
          <country country="PL">Poland</country>
        </aff>
        <aff id="a-42ad91233e64">
          <institution>Gresham Smith</institution>
          <country>the United States of America</country>
        </aff>
      </contrib-group>
      <pub-date date-type="pub">
        <day>17</day>
        <month>1</month>
        <year>2025</year>
      </pub-date>
      <volume>9</volume>
      <elocation-id>e000075</elocation-id>
      <history>
        <date date-type="received">
          <day>25</day>
          <month>5</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>18</day>
          <month>11</month>
          <year>2024</year>
        </date>
      </history>
      <permissions>
        <copyright-year>2025</copyright-year>
      </permissions>
      <abstract id="abstract-abstract-title-4a86967be4b84d5f80b3a3f6613953f2">
        <title id="abstract-title-4a86967be4b84d5f80b3a3f6613953f2">Abstract</title>
        <p id="paragraph-96736142002a474f95147a0e624b5012">Pedestrians are among the most vulnerable road users in urban areas, and their safety is a growing concern for transportation planners and engineers. Pedestrians are at disproportionately high risk for injuries or fatalities in crashes with motor vehicles, highlighting the critical need to address their safety. To address the dangers urban pedestrians face, the relationship between pedestrian crashes and their contributing factors must first be understood. One way to do this is to use statistical models relating pedestrian crash frequency with quantifiable contributing factors, such as land use, demographics, and roadway characteristics. Perhaps the most important of these factors is pedestrian exposure, which is often difficult to obtain because pedestrian volumes are not as widely available as vehicle volumes. Since pedestrian volumes are not available across an entire network, they are often estimated using statistical models—for example, negative binomial (NB) regression—rather than being directly observed. These models are typically a ‘one-size-fits-all’ approach, applying the same model to estimate pedestrian exposure across the entire network. However, relationships between pedestrian exposure and explanatory features—such as population, infrastructure design, and land use context—might differ significantly with respect to the context of an individual location. To address this issue, this paper proposes a model-based recursive partitioning (MBRP) algorithm to develop pedestrian exposure models. The MBRP approach combines traditional statistical methods (e.g. NB regression) with recursive data partitioning techniques commonly found in tree-based machine learning methods. This innovative approach yields a collection of exposure models stratified according to selected input variables with unique relationships between explanatory variables and exposure. 
The proposed method was tested on pedestrian exposure data from North Carolina and significantly improved predictions of pedestrian volumes by approximately 10%. Therefore, the MBRP algorithm presents a promising tool for advancing pedestrian safety analyses in practical applications.</p>
      </abstract>
      <kwd-group id="kwd-group-4b7f8496b0044efaa07a9ad56ee4480a">
        <title>Keywords</title>
        <kwd>exposure model</kwd>
        <kwd>model based recursive partitioning</kwd>
        <kwd>negative binomial regression</kwd>
        <kwd>pedestrians</kwd>
        <kwd>pedestrian safety</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec>
      <title id="title-56ca6f71d8684fd0affe2a34353d6088">Introduction</title>
      <p id="paragraph-5ed2d8efcad54369bc58a96fc8107e8e">Pedestrian safety is a topic of growing concern in the United States, especially in urban areas where 84% of pedestrian fatalities in traffic crashes occur (<xref id="x-d662c1c8c989" rid="R253150932180186" ref-type="bibr">NHTSA, 2023</xref>). Widely considered to be the most vulnerable roadway users, pedestrians are disproportionately represented in fatality statistics, and their representation is growing at an alarming rate. Data from the Fatality Analysis Reporting System (FARS) indicates that 7 388 pedestrians were killed in traffic crashes in 2021, about 19% of all traffic fatalities in the United States. The highest pedestrian fatality total since 1981, this figure also represents a 12.5% increase from the previous year, continuing a trend of yearly increases dating back to 2013, when pedestrian fatalities accounted for 3% less of all traffic fatalities (<xref id="x-db54f6e40397" rid="R253150932180198" ref-type="bibr">NHTSA, 2023</xref>). To address the growing concern for pedestrian safety, we must first understand the relationship between factors that contribute to pedestrian crashes and crash outcomes.</p>
      <p id="paragraph-ad04b822a19642a18283bd803eba009c">Often these relationships are quantified through statistical models that relate frequency of pedestrian crashes with observable factors that contribute to the crashes. Many different models have been used to investigate the relationships between pedestrian crashes and their contributing factors – most often including combinations of variables such as land use, socio-demographic information, and roadway characteristics. But perhaps the most important predictor of pedestrian safety outcomes is pedestrian exposure. Unfortunately, pedestrian exposure can be difficult to obtain because pedestrian volumes are not as widely available across a roadway network as vehicular volumes. This is because network-scale pedestrian counts are resource-intensive due to high costs associated with labor for manual counts and prices charged for automated counts. Some pedestrian volume data is more widely available from fitness-tracking sources such as Strava, but data from fitness-trackers is flawed in that it relays a self-reporting sample and the trackers are subject to error due to poor GPS reception, which is especially an issue in urban environments (<xref id="xref-5e245cf680c5451aba72e494529f1f35" rid="R253150932180199" ref-type="bibr">Lee &amp; Sener, 2020</xref>). Accurate volumes can also be difficult to obtain and even impractical to use due to highly variable daily volumes, short trips which may not be observed, and difficulties in detecting individuals (<xref id="x-e13e274de571" rid="R253150932180206" ref-type="bibr">Lagerwey et al., 2015</xref>). Instead of using counts directly, pedestrian volumes are usually estimated through statistical models.</p>
      <p id="paragraph-c959797ed7074f6eb8dc28e0525f27be">Several studies have developed pedestrian exposure models to predict the amount of pedestrian activity at a given level based on input variables that reflect the built environment, roadway features and other variables. These have traditionally been developed using log-linear ordinary least squares regression (OLS) or negative binomial (NB) regression  (<xref rid="R253150932180205" ref-type="bibr">Behnam &amp; Patel, 1977</xref>; <xref rid="R253150932180200" ref-type="bibr">Griswold et al., 2019</xref>; <xref rid="R253150932180193" ref-type="bibr">Hankey et al., 2012</xref>; <xref rid="R253150932180197" ref-type="bibr">Haynes et al., 2010</xref>; <xref rid="R253150932180191" ref-type="bibr">Lindsey et al., 2006</xref>; <xref rid="R253150932180187" ref-type="bibr">Lindsey et al., 2007</xref>; <xref rid="R253150932180183" ref-type="bibr">Liu &amp; Griswold, 2009</xref>; <xref rid="R253150932180194" ref-type="bibr">Miranda-Moreno &amp; Fernandes, 2011</xref>; <xref rid="R253150932180189" ref-type="bibr">Pulugurtha &amp; Repaka, 2008</xref>; <xref rid="R253150932180196" ref-type="bibr">Schneider et al., 2009</xref>; <xref rid="R253150932180203" ref-type="bibr">Schneider et al., 2012</xref>). Pedestrian exposure has also been estimated using Tobit models and by modifying NB regression techniques to artificially inflate zero value pedestrian counts, in both cases relating the counts to demographics, land use, and traffic data  (<xref id="xref-0b6d47d1fd3b42c8b368d25998cdaf5b" rid="R253150932180204" ref-type="bibr">Lee et al., 2019</xref>). Still other studies suggest using stepwise linear regression to account for spatial variations in independent variables  (<xref rid="R253150932180202" ref-type="bibr">Hankey &amp; Lindsey, 2016</xref>; <xref rid="R253150932180201" ref-type="bibr">Hankey et al., 2017</xref>; <xref rid="R253150932180195" ref-type="bibr">Lu et al., 2018</xref>).</p>
      <p id="paragraph-dc5b3556115a4144b7d3d56b53a87c3f">While these model types have their own merit, they also have various flaws when applied to estimating pedestrian exposure. OLS regression does not account for the count nature of volume data, and using a log-linear form assumes a logarithmic distribution that may not be observed. Similarly, Tobit models assume a normal distribution for the dependent variable which is not typically observed in pedestrian count data. Stepwise linear regression may result in atheoretical coefficient estimates, which makes interpretation complicated and may limit transferability to other datasets. NB regression is the most appropriate and the most common, because of its ability to account for overdispersion in fluctuating pedestrian volumes and the count nature of the data. Even so, all these models are flawed in that they are typically a ‘one-size-fits-all’ approach in which the same model is used to estimate pedestrian exposure at all locations within a transportation network. However, the relationships between pedestrian exposure and explanatory features—such as population, infrastructure design, and land use context—might differ significantly with respect to the context of an individual location, which may not be known a priori. Incorporating these differences could help improve the exposure model and provide more accurate predictions. </p>
      <p id="paragraph-109ed09cc96b491ea2e98e41b3526a01">To help address this issue, this paper proposes a model-based recursive partitioning (MBRP) algorithm to develop pedestrian exposure models. The MBRP approach combines traditional statistical methods (e.g. NB regression) with the recursive data partitioning techniques commonly found in tree-based machine learning methods. The proposed method was tested on pedestrian exposure data obtained in North Carolina and shown to significantly improve predictions of pedestrian volumes by approximately 10%. Therefore, the MBRP algorithm presents a promising tool for advancing pedestrian safety analysis in practical applications.</p>
      <p id="paragraph-c55c27b55af547b9ab9fe992b3f46151">The remainder of this paper is organized as follows. Section 2 provides a description of the methodology used for NB regression and the proposed MBRP approach. Section 3 describes the dataset used. Section 4 provides an analysis of the results from the MBRP model. Finally, Section 5 contains concluding remarks.</p>
    </sec>
    <sec>
      <title id="title-bf1a554d7c1f4ea4a82fed5604a0dd6d">Methodology</title>
      <p id="paragraph-9713912c60a44c41af128510d922cdf0">The goal of this research is to demonstrate the potential of the MBRP algorithm to estimate pedestrian exposure better than traditional regression methods. To do so, exposure models were developed over a training dataset using traditional NB regression methods and the MBRP algorithm. The performance of the MBRP model was judged relative to the NB regression model based on goodness of fit statistics over a separate test dataset and cumulative residual (CURE) plots.</p>
      <sec>
        <title id="title-36ba3ce79c6b4821b7dfcdf0c194df97">NB regression</title>
        <p id="paragraph-8e5dbc8c070d4c5fb9aeb30b384c90d8">Pedestrian counts are always non-negative integers and are therefore most appropriately modeled using count models. Though there are many count regression models, NB regression models are used most extensively in research due to their ability to account for overdispersion in the dataset, which is commonly observed in pedestrian count data. This paper’s NB regression procedure is adapted from <xref id="xref-1aefff6742b44a87b6e9456901ca59ef" rid="R253150932180193" ref-type="bibr">Hankey et al. (2012)</xref> and <xref id="xref-e5c5ed0532454f308845ba671168daa8" rid="R253150932180204" ref-type="bibr">Lee et al. (2019)</xref>.</p>
        <p id="paragraph-367e78777ddc46a89cc449e269590597">NB regression can be described through the following formulation: Let <inline-formula id="inline-formula-4d946509e7ec456e84f102a8bf774ebc"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mn>2</mml:mn><mml:mo>,</mml:mo><mml:mn>3</mml:mn><mml:mo>,</mml:mo><mml:mo>…</mml:mo><mml:mo>,</mml:mo><mml:mi>N</mml:mi></mml:math></inline-formula> represent the index of a given location where <inline-formula id="inline-formula-8c47c7bbcdb445bb9e5ed566285006fe"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>N</mml:mi></mml:math></inline-formula> is the number of locations in the dataset. In the NB model, the pedestrian count at a location <inline-formula id="inline-formula-7030b1e855be4f5abd2bcb7fcc1d4dd7"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>i</mml:mi></mml:math></inline-formula>, takes an exponential form as shown in <xref id="x-aad29e6702b2" rid="disp-formula-group-f66678cc8f3345da8463dba4257309fb" ref-type="disp-formula">Equation 1</xref>:</p>
        <disp-formula-group id="disp-formula-group-f66678cc8f3345da8463dba4257309fb"> <disp-formula><label>1</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:msub><mml:mi>λ</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mi>E</mml:mi><mml:mfenced><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfenced><mml:mo>=</mml:mo><mml:mi>exp</mml:mi><mml:mfenced><mml:mrow><mml:mi>β</mml:mi><mml:msub><mml:mi>X</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>ε</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfenced></mml:math></disp-formula></disp-formula-group>
        <p id="paragraph-862d17ced05d46928098beb0c9be09ef">where <inline-formula id="inline-formula-7191ac9060df4d48be192ab607ce530e"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:msub><mml:mi>λ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula> is the predicted pedestrian count at location <inline-formula id="inline-formula-64cd9ea6c0e744af9401dfbd6d393105"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>i</mml:mi></mml:math></inline-formula>, <inline-formula id="inline-formula-0ffe6cb1a7624ba2a14eda18276e3834"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula> is the observed pedestrian count at location <inline-formula id="inline-formula-3994e5c1cfff4bbe999c4bfa3714924a"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>i</mml:mi></mml:math></inline-formula>, <inline-formula id="inline-formula-d870401d85574fa1acef5390fd5c1b13"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>β</mml:mi></mml:math></inline-formula> is the vector of estimated parameters, <inline-formula id="inline-formula-15437c65b0474cdc9ec3fc070f3311e2"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:msub><mml:mi>X</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula> is the associated vector of explanatory variable values observed at location <inline-formula id="inline-formula-3076864a958f4250a1ae701c005785ec"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>i</mml:mi></mml:math></inline-formula>, and <inline-formula id="inline-formula-9d004e8fa71d429f81d44dcf216345e6"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:msub><mml:mi>ε</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula> is an error term such that <inline-formula id="inline-formula-d7dfd826f2e9430788d1db600f23b856"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mrow><mml:mi>exp</mml:mi><mml:mfenced><mml:msub><mml:mi>ε</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfenced></mml:mrow></mml:math></inline-formula> has a gamma distribution. A maximum likelihood estimation (MLE) method was adopted using the probability distribution for NB regression as presented in <xref id="x-0e8f39a17fa2" rid="disp-formula-group-3154ae55729a42ebb24ae53bea73262b" ref-type="disp-formula">Equation 2</xref>, and the likelihood function as presented in <xref id="x-43afde643da9" rid="disp-formula-group-997791009d5e4bc1a919643d2d88dbf7" ref-type="disp-formula">Equation 3</xref>. The MLE method allows for estimation of the coefficient parameter, <inline-formula id="inline-formula-5f711e793d4c4e25b874eedea784539b"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>β</mml:mi></mml:math></inline-formula>, and the overdispersion parameter, <inline-formula id="inline-formula-d01158bf91264ad4a5e7cf2c362f2e41"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>α</mml:mi></mml:math></inline-formula>, relying on the gamma function, denoted by <inline-formula id="inline-formula-0763966f71954db89d66a801841919cc"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>Γ</mml:mi><mml:mo>(</mml:mo><mml:mo>·</mml:mo><mml:mo>)</mml:mo></mml:math></inline-formula>.</p>
        <disp-formula-group id="disp-formula-group-3154ae55729a42ebb24ae53bea73262b"> <disp-formula><label>2</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>P</mml:mi><mml:mfenced><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfenced><mml:mo>=</mml:mo><mml:mo> </mml:mo><mml:mfrac><mml:mrow><mml:mi>Γ</mml:mi><mml:mfenced><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>α</mml:mi></mml:mfrac><mml:mo>+</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mi>Γ</mml:mi><mml:mfenced><mml:mfrac><mml:mn>1</mml:mn><mml:mi>α</mml:mi></mml:mfrac></mml:mfenced><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>!</mml:mo></mml:mrow></mml:mfrac><mml:msup><mml:mfenced close="]" open="["><mml:mfrac><mml:mrow><mml:mi>α</mml:mi><mml:msub><mml:mi>λ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>+</mml:mo><mml:mi>α</mml:mi><mml:msub><mml:mi>λ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mfenced><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:msup><mml:msup><mml:mfenced close="]" open="["><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mn>1</mml:mn><mml:mo>+</mml:mo><mml:mi>α</mml:mi><mml:msub><mml:mi>λ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mfenced><mml:mfrac><mml:mn>1</mml:mn><mml:mi>α</mml:mi></mml:mfrac></mml:msup></mml:math></disp-formula></disp-formula-group>
        <disp-formula-group id="disp-formula-group-997791009d5e4bc1a919643d2d88dbf7"> <disp-formula><label>3</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>L</mml:mi><mml:mo>(</mml:mo><mml:mi>α</mml:mi><mml:mo>,</mml:mo><mml:mi>β</mml:mi><mml:mo>)</mml:mo><mml:mo> </mml:mo><mml:mo>=</mml:mo><mml:mo> </mml:mo><mml:msubsup><mml:mo>∏</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo> </mml:mo></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mo> </mml:mo></mml:mrow></mml:msubsup><mml:mi>P</mml:mi><mml:mfenced><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfenced></mml:math></disp-formula></disp-formula-group>
        <p id="paragraph-11417d110b6441cdaa0b846d60aec8d6">Selecting parameters which maximize the likelihood function presented in <xref id="x-323bf88c0560" rid="disp-formula-group-997791009d5e4bc1a919643d2d88dbf7" ref-type="disp-formula">Equation 3</xref> establishes a model expected to best fit the data. Typically, the likelihood value found by maximizing <xref id="x-92bdfee39ef4" rid="disp-formula-group-997791009d5e4bc1a919643d2d88dbf7" ref-type="disp-formula">Equation 3</xref> is very small, so frequently the natural log of <xref id="x-ffa6d8ebc113" rid="disp-formula-group-997791009d5e4bc1a919643d2d88dbf7" ref-type="disp-formula">Equation 3</xref> is optimized instead and is reported as the log-likelihood.</p>
      </sec>
      <sec>
        <title id="title-3324ec8dfb0a44cc9a7aed9241af286c">MBRP algorithm</title>
        <p id="paragraph-e51407a34778454cbcdbd3e2c3e21b1a">The MBRP algorithm combines traditional statistical modeling, such as NB regression, with recursive data partitioning techniques commonly found in tree-based machine learning methods. In the MBRP algorithm, the root node is a parametric model fitted over the entire dataset. Child nodes are then formed through splitting based on a decision rule, which continues until the terminal node of the tree model is reached. <xref id="x-bb84057f7e06" rid="figure-163076f385f44165a12958ccd5363104" ref-type="fig">Figure 1</xref> depicts a general form of the tree model (<xref id="xref-8e0ccc74d3424292b6c82f2599494ca8" rid="R253150932180184" ref-type="bibr">Kashani &amp; Mohaymany, 2011</xref>). The following formulation for the MBRP algorithm draws extensively from <xref id="x-6cbac84ac7c5" rid="R253150932180185" ref-type="bibr">Seibold et al. (2016)</xref> and descriptions from <xref id="xref-23a5f4b182fe464cb8a661078e8a3e77" rid="R253150932180181" ref-type="bibr">Tang and Donnell (2019)</xref>.</p>
        <p id="paragraph-4ab091c2b4f34bbf8a7c96187dfd6377">Developing a model using the MBRP algorithm is a process that occurs in three steps: </p>
        <list list-type="order">
          <list-item id="li-0d692f225a30">
            <p>Fit a parametric model to all observations in the dataset;</p>
          </list-item>
          <list-item id="li-0286dce1af05">
            <p>Test coefficient stability over the splitting variable; and</p>
          </list-item>
          <list-item id="li-4111781a9571">
            <p>Determine the optimal cut point of the splitting variable.</p>
          </list-item>
        </list>
        <p id="paragraph-fa972363f9514619af5f00ff912eaf3c">In Step 1, the parametric model with parameter vector, <inline-formula id="inline-formula-7f1ee349655c414282e201cf52df5146"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>θ</mml:mi></mml:math></inline-formula> (represented by the root node in <xref rid="figure-163076f385f44165a12958ccd5363104" ref-type="fig">Figure 1</xref>) may be estimated through methods such as OLS or MLE which inform the objective function, <inline-formula id="inline-formula-f3e5ed914c8c40f9b5d6f31ac73fabc4"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>Ψ</mml:mi><mml:mo>(</mml:mo><mml:mo>·</mml:mo><mml:mo>)</mml:mo></mml:math></inline-formula> as found in <xref id="x-13497d791673" rid="disp-formula-group-045606e210d34960840d85995337a4e5" ref-type="disp-formula">Equation 4</xref>. The coefficients are then estimated through a partial score function as shown in <xref id="x-3273dc603cee" rid="disp-formula-group-6a8d7633c948449ab5e2a20c4fa9e196" ref-type="disp-formula">Equation 5</xref>, where <inline-formula id="inline-formula-8132e1d113914c82968671ad7eaeddc4"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>ψ</mml:mi><mml:mo>(</mml:mo><mml:mo>·</mml:mo><mml:mo>)</mml:mo></mml:math></inline-formula> represents the score function, and <inline-formula id="inline-formula-d64a1c412fd344faa668ba3db6b7e751"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>β</mml:mi></mml:math></inline-formula> is the estimated parameter (<xref id="xref-abf5786e1b2346c9af2706af64b91a18" rid="R253150932180185" ref-type="bibr">Seibold et al., 2016</xref>).</p>
        <fig id="figure-163076f385f44165a12958ccd5363104" orientation="portrait" fig-type="graphic" position="anchor">
          <label>Figure 1 </label>
          <caption id="caption-31e9c57cd6e54b17acd3ff494e9940af">
            <title id="title-5650e58e003741359de8d3cd14afe065">General structure of a tree model (<xref id="xref-bd30b70ec3d2444b9de5cc052b40fc64" rid="R253150932180184" ref-type="bibr">Kashani &amp; Mohaymany, 2011</xref>)</title>
          </caption>
          <graphic id="graphic-0b7929749db84b05b9ff749ba6e2d26b" xlink:href="https://typeset-prod-media-server.s3.amazonaws.com/article_uploads/b4c20676-0003-47f6-98f8-f54dc3dd1e1b/image/6e34704b-bed1-4f41-bfb3-76117edcc972-ufigure_1.png"/>
        </fig>
        <disp-formula-group id="disp-formula-group-045606e210d34960840d85995337a4e5"> <disp-formula><label>4</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mover><mml:mi>θ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mo>=</mml:mo><mml:mrow><mml:munder><mml:mrow><mml:mi>arg</mml:mi><mml:mo> </mml:mo><mml:mi>min</mml:mi></mml:mrow><mml:mi>θ</mml:mi></mml:munder><mml:mrow><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:mrow><mml:mi>Ψ</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mfenced><mml:mrow><mml:mi>y</mml:mi><mml:mo>,</mml:mo><mml:mi>X</mml:mi></mml:mrow></mml:mfenced><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:mi>θ</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mrow></mml:math></disp-formula></disp-formula-group>
        <disp-formula-group id="disp-formula-group-6a8d7633c948449ab5e2a20c4fa9e196"> <disp-formula><label>5</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mrow><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:mfrac><mml:mrow><mml:mo>∂</mml:mo><mml:mi>Ψ</mml:mi><mml:mfenced><mml:mrow><mml:msub><mml:mfenced><mml:mrow><mml:mi>y</mml:mi><mml:mo>,</mml:mo><mml:mi>X</mml:mi></mml:mrow></mml:mfenced><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:mi>θ</mml:mi></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mo>∂</mml:mo><mml:mi>β</mml:mi></mml:mrow></mml:mfrac></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:msub><mml:mi>ψ</mml:mi><mml:mi>β</mml:mi></mml:msub></mml:mrow><mml:mfenced><mml:mrow><mml:msub><mml:mfenced><mml:mrow><mml:mi>y</mml:mi><mml:mo>,</mml:mo><mml:mi>X</mml:mi></mml:mrow></mml:mfenced><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:mi>θ</mml:mi></mml:mrow></mml:mfenced></mml:math></disp-formula></disp-formula-group>
        <p id="paragraph-044a88b1e07b41e5a530d078ef52982e">In Step 2, a generalized M-fluctuation test is used to test coefficient stability over splitting variables, with the null hypothesis stating that the partial score functions from <xref id="x-d718dd7ed643" rid="disp-formula-group-6a8d7633c948449ab5e2a20c4fa9e196" ref-type="disp-formula">Equation 5</xref> are independent of partitioning variables. This hypothesis indicates that global estimates of an independent variable are appropriate. <xref id="x-ee02f42abbc4" rid="disp-formula-group-2cfedfeab974478a99ae11b7e72dd823" ref-type="disp-formula">Equation 6</xref> shows the functional form of the null hypothesis, where <inline-formula id="inline-formula-8d13a16dd51e48fe986d9e60216d6f73"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>Z</mml:mi></mml:math></inline-formula> is the splitting variable and <inline-formula id="inline-formula-07b6c4bed2074140990f0e979952d081"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>J</mml:mi></mml:math></inline-formula> is the number of splitting variables  (<xref id="xref-1a375f3b5a88467db38fa6ca086ae8cc" rid="R253150932180185" ref-type="bibr">Seibold et al., 2016</xref>).</p>
        <disp-formula-group id="disp-formula-group-2cfedfeab974478a99ae11b7e72dd823"> <disp-formula><label>6</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:msub><mml:mi>β</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup><mml:mo>:</mml:mo><mml:mo> </mml:mo><mml:msub><mml:mi>ψ</mml:mi><mml:mi>β</mml:mi></mml:msub><mml:mfenced><mml:mrow><mml:mfenced><mml:mrow><mml:mi>Y</mml:mi><mml:mo>,</mml:mo><mml:mi>X</mml:mi></mml:mrow></mml:mfenced><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:mover><mml:mi>θ</mml:mi><mml:mo>^</mml:mo></mml:mover></mml:mrow></mml:mfenced><mml:mo>⊥</mml:mo><mml:msub><mml:mi>Z</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mo>…</mml:mo><mml:mo>,</mml:mo><mml:mi>J</mml:mi></mml:math></disp-formula></disp-formula-group>
        <p id="paragraph-4d5da6aedc4345d3a4091f7f90e706fb">The splitting variable is selected based on the greatest correlation with partial score functions, and the optimal cut point of the splitting variable is determined by evaluating segmented objective functions as shown in <xref id="x-299b22ddf9e1" rid="disp-formula-group-6fe84e90de8149cabd123cab82979b3e" ref-type="disp-formula">Equation 7</xref> and choosing the minimum value. In <xref id="x-bfcd946639be" rid="disp-formula-group-6fe84e90de8149cabd123cab82979b3e" ref-type="disp-formula">Equation 7</xref>, <inline-formula id="inline-formula-aa50a235613240448e0d8fb634c6264c"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:msub><mml:mi>I</mml:mi><mml:mi>b</mml:mi></mml:msub></mml:math></inline-formula> is the set of observations belonging to segment <inline-formula id="inline-formula-3a4d6f6acab84d31a1d2543d6ccc7118"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>b</mml:mi></mml:math></inline-formula> under splitting rule <inline-formula id="inline-formula-a2efe5822a2e430c9caa8b70f7361e9a"> <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>B</mml:mi></mml:math></inline-formula> (<xref id="xref-89150a6f3c8f476cb17e292689959690" rid="R253150932180181" ref-type="bibr">Tang &amp; Donnell, 2019</xref>).</p>
        <disp-formula-group id="disp-formula-group-6fe84e90de8149cabd123cab82979b3e"> <disp-formula><label>7</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML"><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>O</mml:mi><mml:mi>R</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>b</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>B</mml:mi></mml:munderover><mml:munder><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>∈</mml:mo><mml:msub><mml:mi>I</mml:mi><mml:mi>b</mml:mi></mml:msub></mml:mrow></mml:munder><mml:mi>Ψ</mml:mi><mml:mfenced><mml:mrow><mml:msub><mml:mi>Y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>θ</mml:mi><mml:mi>b</mml:mi></mml:msub></mml:mrow></mml:mfenced></mml:math></disp-formula></disp-formula-group>
        <p id="paragraph-e1c0e9da463444efa8eae64f5039dd69">The process outlined above results in child nodes after the splitting rule is followed. The process is then repeated on all child nodes until terminal nodes are reached, where there is no longer coefficient instability as determined in Step 2 of the process. Each of the terminal nodes represents a parametric model, and any observation in the root node that meets the splitting criteria to fall into the terminal node can be predicted using the corresponding parametric model. Additional information about the MBRP algorithm can be found in <xref id="xref-e633f2f0c8824bb295f4b3b2263f03f5" rid="R253150932180207" ref-type="bibr">Zeileis and Hornik (2007)</xref> and <xref id="xref-8b9f8feac4d9472ebb4c2ac4185572a5" rid="R253150932180192" ref-type="bibr">Zeileis et al. (2008)</xref>.</p>
      </sec>
    </sec>
    <sec>
      <title id="title-342e7c4b8e2742c4bcf4a3743472e994">Data</title>
      <p id="paragraph-d767388e5b4d43c3b8d99bdad7493765">Pedestrian count data analyzed in this study comes from the North Carolina Department of Transportation (NCDOT) and was collected and analyzed for a previous study investigating factors contributing to pedestrian crash outcomes (<xref id="xref-706e2c4e95514f2f8946ab185ee5e23d" rid="R253150932180182" ref-type="bibr">Gayah et al., 2022</xref>). The counts are not a random sample, arising from a variety of convenience samples such as turning movement counts (TMCs) and pedestrian safety studies at particularly dangerous intersections or intersections with high volumes relative to other intersections in the city. The non-random sample is still considered to be a valid sample because the counts are known to demonstrate a wide range of pedestrian count values, as well as to accurately represent the expected levels of pedestrian activity near the count location. The counts come from the following sources:</p>
      <list list-type="bullet">
        <list-item id="li-aed96a1fa558">
          <p>1 993 counts collected by NCDOT as part of turning movement counts (TMCs) or other similar analyses</p>
        </list-item>
        <list-item id="li-972ea51d99cc">
          <p>496 counts collected between 2011 and 2020 by the City of Charlotte TMC program as part of an FHWA-funded research project</p>
        </list-item>
        <list-item id="li-977a2ccbca52">
          <p>19 counts from downtown Raleigh, NC, collected for an NCDOT pedestrian safety study</p>
        </list-item>
        <list-item id="li-f8ee1e2a4146">
          <p>539 counts from Greensboro DOT/Greenville Urban Area Metropolitan Planning Organization (MPO)</p>
        </list-item>
        <list-item id="li-34a25cb49432">
          <p>387 counts provided by Gaston-Cleveland-Lincoln MPO</p>
        </list-item>
        <list-item id="li-8176be0289cc">
          <p>184 counts provided by the City of Durham.</p>
        </list-item>
      </list>
      <p id="paragraph-24e78ea683104778a02a02c81148f454">Each observation in the dataset included vehicular volume data, roadway features at the count location, census-level demographic statistics, and land-use statistics for a 0.5-mile radius surrounding the count location. A summary of the variables that were included in final models is provided in <xref id="x-201c90f59ebc" rid="table-wrap-ad212c92622b40e69ffcc996020fa461" ref-type="table">Table 1</xref> and <xref id="x-9af3805b6897" rid="table-wrap-96652b0dcaf6474a9d4b5de2f9f355e0" ref-type="table">Table 2</xref>. The land use mix variable is an aggregate of land uses in the surrounding area adapted from the methodology outlined in <xref id="xref-33cbcda30637492bbce24003796ae03b" rid="R253150932180188" ref-type="bibr">Frank et al. (2004)</xref> and <xref id="xref-914658178f3e4b199dd2b67fb7b0d2bf" rid="R253150932180182" ref-type="bibr">Gayah et al. (2022)</xref>. The land use mix value is based on four land use types: high intensity developed, medium intensity developed, low intensity developed, and all other land use classifications combined, where a value of 1.00 represents a perfect balance of all four land uses, and 0.00 represents only a single land use present. Alcohol sales locations are not commonly considered as an indicator variable; however, including this variable in indicator form can be justified through contextualization—the two categories represent the difference between an area with a single liquor store and a couple of restaurants, and an area with densely clustered bars expecting high foot traffic and fewer vehicles. Including this variable in this form was found to improve model performance relative to a continuous form of alcohol sales locations.</p>
      <table-wrap id="table-wrap-ad212c92622b40e69ffcc996020fa461" orientation="portrait">
        <label>Table 1</label>
        <caption id="caption-5cefa5f303044152bb31e2ca774b2ea5">
          <title id="title-951a0833a58544c0bb1ac7c01728939c">Continuous variables included in final NB and MBRP models</title>
        </caption>
        <table id="table-08c4366869aa4517b8f2d0622ccdf1fe" rules="rows">
          <colgroup>
            <col width="39.89"/>
            <col width="12.04"/>
            <col width="18.679999999999993"/>
            <col width="15.030000000000005"/>
            <col width="14.36"/>
          </colgroup>
          <thead id="table-section-header-c81522c2395e">
            <tr id="tr-df77e1829902">
              <th id="tc-b060b5cb8da9" align="left">
                <p id="p-e2997e159dd8"/>
              </th>
              <th id="tc-57d502d892b5" align="center">
                <p id="p-d2460d904fae">Mean</p>
              </th>
              <th id="tc-353027e0ad5f" align="center">
                <p id="p-ad20baf7fd46">Standard deviation</p>
              </th>
              <th id="tc-beaf27b8d49d" align="center">
                <p id="p-5201fcad618c">Minimum</p>
              </th>
              <th id="tc-70c5165fc91c" align="center">
                <p id="p-6883ba76d8fa">Maximum</p>
              </th>
            </tr>
          </thead>
          <tbody id="table-section-8e84d7d9db53439eb000ffe46ff602b0">
            <tr id="table-row-1583a444edc640ecb14e52cacd0f60ce">
              <td id="table-cell-1ce35a6e41f143d68cd5e3b6b9849816" align="left">
                <p id="paragraph-550df16f56c1438b93d826caaa39318f">Land use mix </p>
              </td>
              <td id="table-cell-dcc8233576084161a103993b89016203" align="right">
                <p id="paragraph-efd4e47f998649e7b9e6f2e23e8b81d9"> 0.80</p>
              </td>
              <td id="table-cell-d44a0d7a5eae4e6f89db253ab119cef2" align="right">
                <p id="paragraph-9c291c1715e9495ca8990267c8b85652"> 0.17</p>
              </td>
              <td id="table-cell-8f3ef7f51c7345b196bd993bb9fc4624" align="right">
                <p id="paragraph-4bc53502a4ff47e49092a77d720fb49a"> 0.10</p>
              </td>
              <td id="table-cell-8c164246f4614253b309ef2062be84f0" align="right">
                <p id="paragraph-2512dca5a3734953b377fe56cbddf6f7">1.00</p>
              </td>
            </tr>
            <tr id="table-row-b2dd8a3f1aed49f0a36795eee922a19d">
              <td id="table-cell-f735b3c2cf6143ada5d78feefa4755aa" align="left">
                <p id="paragraph-83c64d21ca0342a39cc721307e528611">Proportion of non-motorized commuters within 0.25 miles of count location</p>
              </td>
              <td id="table-cell-22074a38145c456a83970fd6ceda7089" align="right">
                <p id="paragraph-6d9dc9f8b3924a5c8f5bb4667fb0de2c"> 0.07</p>
              </td>
              <td id="table-cell-8e28593bacb9471d993f516da0f398bd" align="right">
                <p id="paragraph-7348b05e4d2a4c60a36b949e5483c3ea"> 0.09</p>
              </td>
              <td id="table-cell-c898353593db4277813fa9cfdfbe6e79" align="right">
                <p id="paragraph-c8042f42c1f84ce39f7b6dde8c750c0d"> 0.00</p>
              </td>
              <td id="table-cell-7c37365a27b5452cb7e281893ab875ef" align="right">
                <p id="paragraph-1766b9e8f93340fdbe4fa0f4409bebc8">0.55</p>
              </td>
            </tr>
            <tr id="table-row-afd7c831624d499dab609d0ea06d20d5">
              <td id="table-cell-37f04b9494b047e19b0e7f8fc8d06c01" align="left">
                <p id="paragraph-cc27589f41f34a5fa9d015a7a2251d8b">AADT (veh/day)</p>
              </td>
              <td id="table-cell-0b712119e6e24d2f8ed4d243f006b319" align="right">
                <p id="paragraph-2bac42bb50fb44b49563d9598d55a500"> 20 260</p>
              </td>
              <td id="table-cell-a2b17caede494e779af878213e2dd21e" align="right">
                <p id="paragraph-2d49175624b14e8ca322c25f040f0079"> 11 133</p>
              </td>
              <td id="table-cell-bf3a755c7db7497d96b6b5e4b628cc41" align="right">
                <p id="paragraph-44f56b067d8646f8a173f4ebb7df473a"> 1 200</p>
              </td>
              <td id="table-cell-14d94d8d06304585a1aba4db27bb8429" align="right">
                <p id="paragraph-0a370499e40c4ea499ea679d59fb191f">77 000</p>
              </td>
            </tr>
            <tr id="table-row-1e6b26c11854442391727bd9ae7ab62b">
              <td id="table-cell-0a90daa3711e4c1393b586ceb3410c01" align="left">
                <p id="paragraph-5ca0e140d4f64598b821046f7039110d">Number of parcels within 0.25 miles of count location (parcel count)</p>
              </td>
              <td id="table-cell-385dac6c5a08433899fadb547aa80db1" align="right">
                <p id="paragraph-7c95ddd3bdee495cbc7417617815436d"> 92.98</p>
              </td>
              <td id="table-cell-4b4654e4f16d482c938fb65ece42467d" align="right">
                <p id="paragraph-418aad91c13b4a91800ea652d56e0569"> 91.93</p>
              </td>
              <td id="table-cell-540bb7f8b5334ccb9c17f191648733c3" align="right">
                <p id="paragraph-2603a4b6671d4ed2a4796bdcb7d8a744"> 2</p>
              </td>
              <td id="table-cell-02f94a77e7b64359a422e6722fb986b8" align="right">
                <p id="paragraph-27e28f051e8941599ecbd9a2223cbdce">568</p>
              </td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap id="table-wrap-96652b0dcaf6474a9d4b5de2f9f355e0" orientation="portrait">
        <label>Table 2</label>
        <caption id="caption-75dc95f834094f38b1afc2943339ff70">
          <title id="title-a4c736498d2847c2bbed7967374015b4">Discrete variables included in final NB and MBRP models</title>
        </caption>
        <table id="table-770e7f04238d45a09d27218f2bd96768" rules="rows">
          <colgroup>
            <col width="73.53"/>
            <col width="12.930000000000007"/>
            <col width="13.540000000000001"/>
          </colgroup>
          <thead id="table-section-header-394360293b1a">
            <tr id="tr-812a8e043de8">
              <th id="tc-740ffb94b82b" align="left">
                <p id="p-81b733317433"/>
              </th>
              <th id="tc-5728c0953834" align="center">
                <p id="p-61a092c5aee0">1</p>
              </th>
              <th id="tc-e61d3267b080" align="center">
                <p id="p-c931193e03a2">0</p>
              </th>
            </tr>
          </thead>
          <tbody id="table-section-4a2eeeeb18654d1aa748d9e5a35d208d">
            <tr id="table-row-61488b5032cc49c0b0c9024a143f8504">
              <td id="table-cell-1c32d8992e2e4b808f43d2ad0b7cf446" align="left">
                <p id="paragraph-fafd4250da73438f8b76405018703014">Count duration = 13 hours (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-a64934062cbe47d69dcb20eb84cf6b3a" align="right">
                <p id="paragraph-26d57a6cce044714a24ead8b8eff55e3">74.49%</p>
              </td>
              <td id="table-cell-d0d50117a99444f08186b41ebe090bce" align="right">
                <p id="paragraph-046c5fa0da17405ab9b882cbb16123c0">25.51%</p>
              </td>
            </tr>
            <tr id="table-row-07ea5492ef3649fea50914b486ebf6bb">
              <td id="table-cell-60d4ff147e7a4de5825f1cafb3ef89ad" align="left">
                <p id="paragraph-e18b3d6fb10148138b7dd2f1f2f8caf8">Count duration = 16 hours (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-a9469c7e55264deba5544a54d86590f1" align="right">
                <p id="paragraph-493fe9e706434df38831b170f70f50a8"> 5.27%</p>
              </td>
              <td id="table-cell-3b9794ae23d946cd995310fe9728d050" align="right">
                <p id="paragraph-b72df5ed74dd48b6b2c97ac55a020ba6"> 94.73%</p>
              </td>
            </tr>
            <tr id="table-row-1b51cf8b036f410d9e0810512b9f4a5b">
              <td id="table-cell-00c32999fc0a499093f76de9e2a39ebe" align="left">
                <p id="paragraph-6c588ab00b574e5595cf579f6e72d608">Indicator for 0-5 alcohol sales locations within 0.25 miles of count location (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-79440b9ff1474bf788a4d3eaa1d832a9" align="right">
                <p id="paragraph-9e41ad0487ef40878faf9941a86aef15"> 40.00%</p>
              </td>
              <td id="table-cell-276985f1e0a94753a7aae1c4773b5e7f" align="right">
                <p id="paragraph-896fbb6a1867462b8e4888b8155aacf9"> 60.00%</p>
              </td>
            </tr>
            <tr id="table-row-fc5e6403c9594402927ce28a180e3a60">
              <td id="table-cell-6ac9f0a0a039481c939a8d8c8fff71fa" align="left">
                <p id="paragraph-792acd7f0491473db5c98895b5c48b13">Indicator for ≥ 6 alcohol sales locations within 0.25 miles of count location (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-896cc0c5edc84d4684a4c8378ebb9c55" align="right">
                <p id="paragraph-69adbf80450c4766a4bc486a6a605257"> 29.29%</p>
              </td>
              <td id="table-cell-39a5eb5ba8214cf4a7343dfefdacd9d8" align="right">
                <p id="paragraph-9928f1a03479426f8bd0c33752fccea1"> 70.71%</p>
              </td>
            </tr>
            <tr id="table-row-7d506b4c1acb4f239010e9d4912e2d51">
              <td id="table-cell-ae5629c2ac8a477aafdbaa58fbb1ca78" align="left">
                <p id="paragraph-94a721fc6e4d40c3973944097898b080">Indicator for presence of sidewalk (1 indicates present, 0 indicates not present)</p>
              </td>
              <td id="table-cell-cbaf5933bc6545c2a2cf82558729eebf" align="right">
                <p id="paragraph-4d69496b02314f11b3a697b154a795e3"> 69.88%</p>
              </td>
              <td id="table-cell-6d7f1f898930448cbb536335e72b6368" align="right">
                <p id="paragraph-6353ebb171e5439aad1448859c45599d"> 30.12%</p>
              </td>
            </tr>
            <tr id="table-row-3f99817046594122a5a04c6a9bc4dfdb">
              <td id="table-cell-3ea7e04a1bb044e681670f1b28aec7bd" align="left">
                <p id="paragraph-6ea497155461446688d5d377474cb1c4">Indicator for presence of crosswalk (1 indicates present, 0 indicates not present)</p>
              </td>
              <td id="table-cell-85a31483acc6444dbf8512b003c1700c" align="right">
                <p id="paragraph-28d7d86dfc1f420787f63ecc50a5e03d"> 32.76%</p>
              </td>
              <td id="table-cell-c0333766f9c54cef88efa11e9b7fe20d" align="right">
                <p id="paragraph-7bb9b869bd914708aab4a5b919b959a1"> 67.24%</p>
              </td>
            </tr>
            <tr id="table-row-baab87552f194c00bdae41f4a879ccb5">
              <td id="table-cell-89f0a3b5223d472fa13ac90e5441704a" align="left">
                <p id="paragraph-23aafeb38379462d930327462e622474">Indicator for bus stop located within 0.25 miles of count location (1 indicates present, 0 indicates not present)</p>
              </td>
              <td id="table-cell-e5602c4c61ad47ea96378b61a2c6cbb0" align="right">
                <p id="paragraph-79e1a221f0014580a7c0549e55174d15"> 58.72%</p>
              </td>
              <td id="table-cell-f234ed08f209440ebe669d461a58645a" align="right">
                <p id="paragraph-06e6bfc903b14918aab0f242fac18070"> 41.28%</p>
              </td>
            </tr>
            <tr id="table-row-52c22aea00014ce18b40021972c6c09f">
              <td id="table-cell-fc77300e72554a72ac7728c540d673a4" align="left">
                <p id="paragraph-d2de4b4db1c549b6bd5afe331cfb0956">Indicator variable for posted speed limit ≥ 40 mph (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-8c9f357418bb4539b79ec6fce1553e2b" align="right">
                <p id="paragraph-9ee7d524697241f8a41fd90af81e72f2"> 45.68%</p>
              </td>
              <td id="table-cell-8e851b255ea0494ca6c07b2d555c89df" align="right">
                <p id="paragraph-2cc94af249234cc7be74a40afd23cb54"> 54.32%</p>
              </td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p id="paragraph-14c9ee8c20d2437e98b09150af063809">Of the 3 618 counts provided, the majority were performed at intersections, and therefore intersections were selected as the unit of analysis. Counts taken at locations that were not intersections or that were in non-urban environments, as well as counts with durations less than or equal to 2.5 hours or equal to 24 hours, were removed to limit the analysis to characteristically similar count locations. The remaining 2 430 pedestrian counts ranged from 0 to 14 854 pedestrians over the respective durations, though 75% of counts registered 67 or fewer pedestrians. An 80/20 split was performed over the full 2 430 counts, creating a training dataset (1 942 observations) and a test dataset (488 observations) such that both the NB and MBRP models would be estimated over the training dataset, and the models’ fitness would be assessed using goodness-of-fit statistics based on their predictions over the test dataset. The training and test datasets were selected to be representative samples of the full dataset with approximately equal summary statistics, but each dataset was also vetted to ensure representation of outlier counts. Due to the nature of the outlier counts, exact matches for maximum count values could not be achieved, and the training dataset is known to contain a greater proportion of lower count values because of the higher maximum count but otherwise similar summary statistics. <xref id="x-3600bbc81afe" rid="table-wrap-841928e98b7148d4abafb3f7fd339cf4" ref-type="table">Table 3</xref> shows the summary statistics of the final split datasets.</p>
      <table-wrap id="table-wrap-841928e98b7148d4abafb3f7fd339cf4" orientation="portrait">
        <label>Table 3</label>
        <caption id="caption-a2edcae9f3094646833ad43728fc3324">
          <title id="title-a34b3a21ad354881ae269e2da6243b43">Summary statistics of pedestrian counts</title>
        </caption>
        <table id="table-44f6c9c570e7498eaf230d5e3e10e2e1" rules="rows">
          <colgroup>
            <col width="18.259999999999998"/>
            <col width="12.470000000000002"/>
            <col width="15.77"/>
            <col width="11.39"/>
            <col width="11.879999999999999"/>
            <col width="15.89"/>
            <col width="14.34"/>
          </colgroup>
          <thead id="table-section-header-1a0de7fc69e8">
            <tr id="tr-4edaa14c2afb">
              <th id="tc-52a20985072b" align="left">
                <p id="p-18da30d5b0be"/>
              </th>
              <th id="tc-16bba75ef3ff" align="center">
                <p id="p-fe21e0d84479">Minimum</p>
              </th>
              <th id="tc-ee90150c06ef" align="center">
                <p id="p-0433121f7e96">25th-percentile</p>
              </th>
              <th id="tc-283fa1d512d4" align="center">
                <p id="p-54cb0a645c40">Median</p>
              </th>
              <th id="tc-3aad400157ac" align="center">
                <p id="p-bca313b0e80f">Mean</p>
              </th>
              <th id="tc-68d76cdc9f7f" align="center">
                <p id="p-337c6c15e779">75th-percentile</p>
              </th>
              <th id="tc-26d2816e9d6f" align="center">
                <p id="p-9067b805afd1">Maximum</p>
              </th>
            </tr>
          </thead>
          <tbody id="table-section-9afde699511e41ab9afe796f143ebdd5">
            <tr id="table-row-ca3f8f092b474b4c8f67502f8ad2ff03">
              <td id="table-cell-0ca737034a4d4bd59656ecd65df4d847" align="left">
                <p id="paragraph-1d6bdbad636d47edbb9fd895c8292075">Full dataset</p>
              </td>
              <td id="table-cell-9693670b73784efe875b0206444bb047" align="right">
                <p id="paragraph-81b8d38a0b294d289f37f71058b9bf52"> 0</p>
              </td>
              <td id="table-cell-99a51d67ceaf40b3ae4aca2a56a4ac70" align="right">
                <p id="paragraph-5c442f956abf493d918af09a27e56236"> 4</p>
              </td>
              <td id="table-cell-7f6a67f7f971472da8aa41555dc614eb" align="right">
                <p id="paragraph-1dc6477fe4744be7b7d1ee7e79cf777f"> 19</p>
              </td>
              <td id="table-cell-44970567288448e38ae06e546fa74990" align="right">
                <p id="paragraph-c618e5f952e54032afc4dc786784e4ac"> 145.7</p>
              </td>
              <td id="table-cell-5f386c1f54114bf490e41a97668d0c38" align="right">
                <p id="paragraph-be56ec7581f5496ba85bf3e23380a048"> 67.00</p>
              </td>
              <td id="table-cell-66836572ed5b470ca20dd80a0b282e8a" align="right">
                <p id="paragraph-33855bb5739c4527bb4659c2e2087d5a"> 14 854</p>
              </td>
            </tr>
            <tr id="table-row-4e1335831abb40ba845c80c22700243d">
              <td id="table-cell-8b9333bcd03e47739590459ace3512e0" align="left">
                <p id="paragraph-832d6481ffbb49758a630c84f95dd541">Training dataset</p>
              </td>
              <td id="table-cell-6d97883ea8e34c5691bfaffeaf7718c1" align="right">
                <p id="paragraph-d7318e9505844160bad5887e7abe9e60"> 0</p>
              </td>
              <td id="table-cell-4b354cde0f214272a0ea4206716ce2fd" align="right">
                <p id="paragraph-3696bbfa1702401dbb9c73cbb3aa70b7"> 4</p>
              </td>
              <td id="table-cell-9b1583e82b604eed8f99931592306bc4" align="right">
                <p id="paragraph-cd9ef2ec3e804e63aa5dca4436ee1204"> 19</p>
              </td>
              <td id="table-cell-aa44d053928c4ba4946190c6f60f2dfe" align="right">
                <p id="paragraph-ffd8cd2f97f04eb2bbf1977f4ea93a62"> 146.4</p>
              </td>
              <td id="table-cell-00f68efada9b41049f1249052eb242f2" align="right">
                <p id="paragraph-ddfc274a73f648aaa9aee8748052a9cc"> 67.75</p>
              </td>
              <td id="table-cell-1903ceed03b84a32bc71d83a0b65d004" align="right">
                <p id="paragraph-5371ccc153d748fcafecd9f2bde670c1"> 14 854</p>
              </td>
            </tr>
            <tr id="table-row-34894534d3164b4781b192ae330c1fc8">
              <td id="table-cell-6d286b9a435641c2bc4fe29a56227a5b" align="left">
                <p id="paragraph-c868f12c92a14e5b8f48e4bad1a5f2f9">Test dataset</p>
              </td>
              <td id="table-cell-fc95975e33e14f049cf3c3a3c0752776" align="right">
                <p id="paragraph-d5d8cfa52cf845d6a5d7ddff7b081c3b"> 0</p>
              </td>
              <td id="table-cell-3af5e4ae77eb4ff69a017fff0f32b1f5" align="right">
                <p id="paragraph-2307d6d7fa1e45c4ba5076f9b17de8a1"> 4</p>
              </td>
              <td id="table-cell-4aa901e0a87f4ae189de22929535d1e8" align="right">
                <p id="paragraph-4a3827645074409297b241ce939a66f6"> 19</p>
              </td>
              <td id="table-cell-0987c65bf62446439213a653515fc83c" align="right">
                <p id="paragraph-0d249f9a8b87421898d6d553d654505d"> 143.0</p>
              </td>
              <td id="table-cell-e74efc70a0bf46df9c3d1b93f49f4810" align="right">
                <p id="paragraph-2799757ceeec41dfbf056baa8837ac4d"> 65.50</p>
              </td>
              <td id="table-cell-62a32570007d4d9aaa1535a1ffa50c29" align="right">
                <p id="paragraph-0b6ecc60f2c64a64990f5a921c63a69f"> 9 839</p>
              </td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
    </sec>
    <sec>
      <title id="title-8c1785d9023c4996aa951d57305dd889">Analysis and results</title>
      <p id="paragraph-cb57a499243a45d0832fd7901e1743b8">This section describes the estimation results from the NB regression model and the MBRP model, including the assessments of goodness of fit through mean absolute error (MAE), mean absolute percentage error (MAPE), and root mean square error (RMSE). Additionally, a cumulative residual (CURE) plot was generated with both models plotted against the 95-percent confidence interval as determined for the NB regression model, according to the methodology outlined in <xref id="xref-6c2aab758c4949919a1e0c60fc6a78f5" rid="R253150932180190" ref-type="bibr">Hauer (2015)</xref>.</p>
      <p id="paragraph-a0b8255b19bd461eab2ee12fcdabf084">The results of the MLE process for the NB regression model and the model generated from the MBRP algorithm are presented in <xref id="x-b819c82b1e7d" rid="table-wrap-cc7a640115ce47e2aaedc14182433222" ref-type="table">Table 4</xref>. In the modeling process, only the variables found to be statistically significant at the 5% significance level were retained. Exceptions were made for some variables that were found to be insignificant at the 5% level but were deemed theoretically important predictors of pedestrian counts. Additionally, any variables that were found to be inconsistent with theory regarding the sign of the estimated parameter were vetted for their contribution to the model’s predictive performance before being considered for removal.</p>
      <table-wrap id="table-wrap-cc7a640115ce47e2aaedc14182433222" orientation="portrait">
        <label>Table 4</label>
        <caption id="caption-fb9818bc0e9d4433ba0207a3cf09cce3">
          <title id="title-b9d9164354bd43fe902a6257a7af922d">NB regression and MBRP model estimation results</title>
        </caption>
        <table id="table-628c73e65084411b93837df59a8fb565" rules="rows">
          <colgroup>
            <col width="46.10000000000001"/>
            <col width="15.479999999999997"/>
            <col width="18.79"/>
            <col width="19.63"/>
          </colgroup>
          <thead id="table-section-header-b0d4af3ca42b">
            <tr id="tr-cb45cf74d348">
              <th id="tc-0a688ee5a7dd" rowspan="2" align="left">
                <p id="p-420904c396a5">Variable</p>
              </th>
              <th id="tc-341b426f0bd2" rowspan="2" align="center">
                <p id="p-f6c8e091dc6f">NB regression</p>
              </th>
              <th id="tc-3fd0f87debcc" colspan="2" align="center">
                <p id="p-f919757fe064">MBRP</p>
              </th>
            </tr>
            <tr id="tr-339a4bf65502">
              <th id="tc-c65139586138" align="center">
                <p id="p-afe36aa5555d">Parcel count ≤ 71</p>
                <p id="p-af7ee5a74fc3">‘Low urban density’</p>
              </th>
              <th id="tc-830c24ae8446" align="center">
                <p id="p-53248fc95f34">Parcel count &gt; 71</p>
                <p id="p-346e072594f5">‘High urban density’</p>
              </th>
            </tr>
          </thead>
          <tbody id="table-section-832f14e52cb5498e818ca4386dff92c6">
            <tr id="table-row-549213bbe141480c9a14c6ed170fb1ae">
              <td id="table-cell-6478452316524e789c82760ff19c4d43" align="left">
                <p id="paragraph-291740d0fb1b48db8c7dae87d221f206">Constant</p>
              </td>
              <td id="table-cell-7dd3ab350cd24b4bb6cffe6c2d400281" align="right">
                <p id="paragraph-75d306b9e053494dbe3d9f3124ab69cd">2.538</p>
              </td>
              <td id="table-cell-c259e239925f4c219b0961fc3faf4575" align="right">
                <p id="paragraph-0a471a5c0f5343cab8933191e00ff164"> 3.226</p>
              </td>
              <td id="table-cell-6712d45a95a44f80a2b927d16eb65fe7" align="right">
                <p id="paragraph-4858fbdb008941fd8dd27abc60e93457"> 4.926</p>
              </td>
            </tr>
            <tr id="table-row-0ba5acbdac9f4e219d63913521748a42">
              <td id="table-cell-03fba23cae684ea48cc145047a38f5bb" align="left">
                <p id="paragraph-317f4bb3166048d1833ce28cd5f9fb8f">Count duration = 13 hours (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-6a8a2a11900f4c43834eab71dd0b4515" align="right">
                <p id="paragraph-7499ff76d7424b0e93da0ad433e17c18">0.428</p>
              </td>
              <td id="table-cell-8757a2cf178c44ec8ddf382a4885252e" align="right">
                <p id="paragraph-f2a1f06844eb431c9bf1a355486c4fed"> 0.747</p>
              </td>
              <td id="table-cell-5666f533d22a4a1fafa9d6656809683a" align="right">
                <p id="paragraph-bc970c7cdc394eb7aa5fd10cf9a13be7"> 0.293</p>
              </td>
            </tr>
            <tr id="table-row-337cb7b180414053a0e1487d5185c102">
              <td id="table-cell-a722e7e9d48e465782bebfcaaf69b817" align="left">
                <p id="paragraph-6eddab4380c14783ab9b1a350d59ded9">Count duration = 16 hours (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-25e3d7dc887c45acbd50554c73213248" align="right">
                <p id="paragraph-b940220e5deb47cea4fcb369cf934333">-0.408</p>
              </td>
              <td id="table-cell-0b3559ea68454308827092ed32b18062" align="right">
                <p id="paragraph-4d40ac06f9114a35b6b051e87ae2ce73"> <italic id="e-078f9799c473">0.078</italic></p>
              </td>
              <td id="table-cell-95364c6a726944e58da6f01fc4dd7f47" align="right">
                <p id="paragraph-5fb17fe412e946f3b8baf5fd9ef96bdf"> -0.965</p>
              </td>
            </tr>
            <tr id="table-row-977812d045064cacb3dc3b25b6254071">
              <td id="table-cell-c98c4025371f425fa7c7172a642e68b6" align="left">
                <p id="paragraph-75ab4a38d5814f868b8ba94cc5fcb4f8">Land use mix</p>
              </td>
              <td id="table-cell-aba2d84ed310451b9b0a867fedb4a3c1" align="right">
                <p id="paragraph-d6ed1bff847948a19f0a5e157fa4a759"> 1.265</p>
              </td>
              <td id="table-cell-9c8e217592d14047b51923b6e98c6b71" align="right">
                <p id="paragraph-094cac7ec67c45d78076d40ba40f5e2e"> ---</p>
              </td>
              <td id="table-cell-e2d9f2cde78349ab93b05a372a7fe174" align="right">
                <p id="paragraph-b667def7d81346ae85a82fc40f8be4b9"> ---</p>
              </td>
            </tr>
            <tr id="table-row-d286eb0727524bd1ba6fd15613b63329">
              <td id="table-cell-e856c0ef0b8546d381f47225386e2e46" align="left">
                <p id="paragraph-11a7fca6f47e485b8e29fc9a9a75de41">Indicator for 0–5 alcohol sales locations within 0.25 miles of count location (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-959e730578d841c885dc1cc4378cb27d" align="right">
                <p id="paragraph-2392d5cb4985424a8354496337ea9b6c"> 0.172</p>
              </td>
              <td id="table-cell-f089f42afd074877a28cc5c2d71f4de9" align="right">
                <p id="paragraph-be33dc0b121d4b94b2e4396b119104fe"> <italic id="e-c328513589fc">0.210</italic></p>
              </td>
              <td id="table-cell-2bc2d7f29ea742d2bd4a2af08bf9075b" align="right">
                <p id="paragraph-60bd3d779d1f4df5a361de32460fc2aa"> 0.603</p>
              </td>
            </tr>
            <tr id="table-row-c71cec9019fd4d239a062f8ece9aa580">
              <td id="table-cell-efe1a1d2d54c46748a3769306880ceca" align="left">
                <p id="paragraph-82379d82de86436299ad47e410caa7d4">Indicator for ≥ 6 alcohol sales locations within 0.25 miles of count location (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-06b8c29902e74cd9ad629daa0830f42e" align="right">
                <p id="paragraph-e4c97bd860d6451f8cfa9eaa9e77a6cc"> 0.680</p>
              </td>
              <td id="table-cell-ce94953658c34bcdac22fb47dfb31a71" align="right">
                <p id="paragraph-76dc0a152b034af49020f0b97e5b5a5f"> 0.743</p>
              </td>
              <td id="table-cell-3d6454827c4544c5b1f9339925f5764e" align="right">
                <p id="paragraph-d406f504f0284a79b32b27e355750ee4"> 1.054</p>
              </td>
            </tr>
            <tr id="table-row-fdca11cc57f14f3e8ed5f6606b48c43e">
              <td id="table-cell-a0ebd1a0381c447eb266e0c36ec658d5" align="left">
                <p id="paragraph-ce29b63d4d5f4064af90d1dfb4b84ff4">Proportion of non-motorized commuters within 0.25 miles of count location</p>
              </td>
              <td id="table-cell-6f4e536a1959479eb661c5d51ea83bd3" align="right">
                <p id="paragraph-26e4d1fdf1f54dcca3b759352b5111ad"> 9.262</p>
              </td>
              <td id="table-cell-5292db3672054dd3a49909f16aea8c78" align="right">
                <p id="paragraph-4bd5eb3f0cad4b0c9a7a982785b8b55b"> 8.958</p>
              </td>
              <td id="table-cell-c31d4b3a8fda48349ebc9e54bd53d208" align="right">
                <p id="paragraph-f81f6edf67a24ff6a6940fc37bc48b9e"> 9.009</p>
              </td>
            </tr>
            <tr id="table-row-a76ddba1bf694b2e9e4448f6e496eabe">
              <td id="table-cell-87f9e1f2a5e247c8967b1b859a159357" align="left">
                <p id="paragraph-b5e713252c9043fd9e99fa9d20a848c1">Natural logarithm of AADT (veh/day)</p>
              </td>
              <td id="table-cell-6d4782fd2ac14029ba0659cbe70bfbc3" align="right">
                <p id="paragraph-5b5f1a1d0d0342c2b455de5cfc7e1b3a"> -0.301</p>
              </td>
              <td id="table-cell-4ebeae178d6e4fb1b120e30cd0c03720" align="right">
                <p id="paragraph-fbd9674211384b9a888918f63f89d24f"> -0.228</p>
              </td>
              <td id="table-cell-c29a518596904cd1b7e9af339b07f363" align="right">
                <p id="paragraph-d1c57b758b874265990b4959f7f5695e"> -0.260</p>
              </td>
            </tr>
            <tr id="table-row-e7802c12da064fb79b6621fc2f333718">
              <td id="table-cell-9acdef08d85241afadb50abffaf20682" align="left">
                <p id="paragraph-a64cd85bb4bd4d6a935305e9a41254a1">Indicator for presence of sidewalk (1 indicates present, 0 indicates not present)</p>
              </td>
              <td id="table-cell-6be47f793a674675b61c397c40905f24" align="right">
                <p id="paragraph-bceb988cbb8c43b79dfdb23eca2647eb"> 0.972</p>
              </td>
              <td id="table-cell-6b8bb62a22d448a18495e914e39d5fc7" align="right">
                <p id="paragraph-f583a43cbd4841418251cf1275e6fd33"> 1.046</p>
              </td>
              <td id="table-cell-b1837730da0348918b58bf8d9275a87e" align="right">
                <p id="paragraph-35c19b14b53e4d8981de7275598ad0e5"> 0.696</p>
              </td>
            </tr>
            <tr id="table-row-a0ce3ab93d934661a03bfaa3a8249c6f">
              <td id="table-cell-82678433a7054089b0d6ac89f3bfd4fb" align="left">
                <p id="paragraph-a3bccacf59c544b89d4d2b72b23c24a6">Indicator for presence of crosswalk (1 indicates present, 0 indicates not present)</p>
              </td>
              <td id="table-cell-93aabd75b54a4a3ca83da343480b6cbc" align="right">
                <p id="paragraph-d4ba89ebaf4748e2923d8c596cdcf493"> 0.576</p>
              </td>
              <td id="table-cell-46baae2c5a564b7eb8ac7baeeada0833" align="right">
                <p id="paragraph-125f19abc61644e8a2af5643340fa55e"> 1.019</p>
              </td>
              <td id="table-cell-c52a0203eced47eeb6a2aa9b940fc019" align="right">
                <p id="paragraph-fa6dac1b89024fd68e1144c438b5edbe">
                  <italic id="e-d2219b961bec"> -0.089</italic>
                </p>
              </td>
            </tr>
            <tr id="table-row-a02d18f3187e46beba62c205425ed47d">
              <td id="table-cell-7b893a2866b8457eb3f3c91170ad0130" align="left">
                <p id="paragraph-b0ec0b264575428aaf5f2719767f37ad">Indicator for bus stop located within 0.25 miles of count location (1 indicates present, 0 indicates not present)</p>
              </td>
              <td id="table-cell-cc30fa96e77846f1a5820abc8e84ed47" align="right">
                <p id="paragraph-15697607a49f459e8a6c14db08bfa41a"> 0.214</p>
              </td>
              <td id="table-cell-b70b5248919946089ae56a69033ddef6" align="right">
                <p id="paragraph-8edb7e422ff3492b834bee3ee241abdc"> 0.418</p>
              </td>
              <td id="table-cell-199a9eeaf4fc45c7bd0bb74f1da5da8b" align="right">
                <p id="paragraph-293a2ad51dc346bfa3510eb8a4849921"> <italic id="e-d6c265c75685">0.008</italic></p>
              </td>
            </tr>
            <tr id="table-row-96f5f94bc5ec44f69b54af9a0ce4ce3c">
              <td id="table-cell-8d5ca14040b24e9794145992b69a1330" align="left">
                <p id="paragraph-7d4785225ef641b6ad62680cab34c2cd">Natural logarithm of parcel count</p>
              </td>
              <td id="table-cell-a5424b9b2e82432db5115e078a3b0dc3" align="right">
                <p id="paragraph-38be6359159146559cff95b9a89316c4"> 0.262</p>
              </td>
              <td id="table-cell-e1e176984579407dbb4dc11089aca5ab" align="right">
                <p id="paragraph-5e82b3c3dfe1492cad17d294892d0a24"> ---</p>
              </td>
              <td id="table-cell-71369ecd06cf4fc28f7f79fbf62edadc" align="right">
                <p id="paragraph-3c5401f1642440e39dcf385cd94b1eb6"> ---</p>
              </td>
            </tr>
            <tr id="table-row-41755e749b454edaa60fb568eb306a1f">
              <td id="table-cell-257b8d9f1c154fe1931600fa32afe84b" align="left">
                <p id="paragraph-26c7ed929a1841fa98550ea5fecd0c24">Indicator variable for posted speed limit ≥ 40mph (1 indicates yes, 0 indicates no)</p>
              </td>
              <td id="table-cell-5b224e951b534362aca8403f622d3e22" align="right">
                <p id="paragraph-95d3309601f44527958e9f748ac43c56"> -0.636</p>
              </td>
              <td id="table-cell-91c4935ea6b74a4d893689f29d4dc59d" align="right">
                <p id="paragraph-6210007232724b71b8f2f8881979e1cd"> -0.746</p>
              </td>
              <td id="table-cell-922025298af14390866e6e297ac7560c" align="right">
                <p id="paragraph-eebbc258a6d44fe7a3fbce2273c7c682"> -0.381</p>
              </td>
            </tr>
            <tr id="table-row-28a8a3eab8004afcb405393ddd330527">
              <td id="table-cell-d3fcf9b430c04ba291c47e96c9aab839" align="left">
                <p id="paragraph-303a1d85e5184409b92120f23afa077a">Overdispersion parameter</p>
              </td>
              <td id="table-cell-a7eae5fee00d49a68f28afbb301995fc" align="right">
                <p id="paragraph-1dfb592d919943c9a833787f68f5d4f5"> 1.550</p>
              </td>
              <td id="table-cell-05e61e65ab004802a4f3abd198fc1b70" align="right">
                <p id="paragraph-8ad4d6c5d086446081f4aeb405a83e2d"> 2.435</p>
              </td>
              <td id="table-cell-80d24c6f952148928ec085536fd44313" align="right">
                <p id="paragraph-331c24b700ad4dc09618b0970d3db6a6"> 1.226</p>
              </td>
            </tr>
            <tr id="table-row-32e37b9b1b2241b5a9c5f032d0f05aae">
              <td id="table-cell-926025ef59c942719b71206ae0c9a892" align="left">
                <p id="paragraph-c79b54bf4fe340babefd63c520342993">Akaike Information Criterion (AIC)</p>
              </td>
              <td id="table-cell-8f0407d2fdee43da99390083416cf088" align="right">
                <p id="paragraph-33241c48a6654294ade901866c227329"> 17 889</p>
              </td>
              <td id="table-cell-4723113f8c9a483ab90c626a7035c411" colspan="2" align="center">
                <p id="paragraph-f24862a895f24e74a54ab35300433a65"> 17 857</p>
              </td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn-group>
            <fn id="f-ce01a28a85d9">
              <p id="p-20ad5318a99e">Values in italics are not significant at the 95% confidence level.</p>
            </fn>
          </fn-group>
        </table-wrap-foot>
      </table-wrap>
      <sec>
        <title id="title-51d8e00040534809b7cc2099e90aa0e8">NB regression</title>
        <p id="paragraph-3912e61dc8bc42819cab4e1eed5f365c">All variables included in the final NB regression model were found to be statistically significant at the 95% confidence level or higher and were found to meet expectations consistent with engineering judgement:</p>
        <list list-type="bullet">
          <list-item id="li-6c91f25ed86d">
            <p><bold id="s-7029b6776fe8">Count duration.</bold> In the dataset, the base condition is a 12-hour count. Therefore, it would be expected that a 13-hour count would yield a higher prediction due to a longer period for pedestrians to be observed. The same logic would indicate that a 16-hour count parameter should be greater than the 13-hour count parameter; however, 16-hour counts are typically conducted at two-way stop intersections being considered for signalization. Generally, these intersections have high traffic volumes which make pedestrian access uncomfortable, resulting in fewer pedestrians. Therefore, a smaller or even negative coefficient may be appropriate to describe the effects of a 16-hour count on pedestrians observed.</p>
          </list-item>
          <list-item id="li-d52616f8fb38">
            <p><bold id="s-8b0bb0bba655">Traffic conditions.</bold> As previously described, pedestrians are less comfortable walking near roadways with higher traffic volumes where they may be more vulnerable to crashes (<xref id="xref-31733b0ae97a423c9710c4f2ba9ede67" rid="R253150932180194" ref-type="bibr">Miranda-Moreno &amp; Fernandes, 2011</xref>). That trend also extends to roadways with higher speed limits as crashes involving pedestrians and vehicles moving at higher speeds are known to result in more severe outcomes for pedestrians (<xref id="xref-2dae1013ef0e4f23be35b6cd002d5156" rid="R253150932180189" ref-type="bibr">Pulugurtha &amp; Repaka, 2008</xref>). In the NB regression model, we find that the coefficients associated with the natural logarithm of AADT and speed limits greater than or equal to 40 miles per hour are negative, indicating a negative impact on pedestrian counts.</p>
          </list-item>
          <list-item id="li-60def205f21f">
            <p><bold id="s-6a337bd96c69">Pedestrian-friendly infrastructure.</bold> The presence of features such as crosswalks and sidewalks is expected to contribute positively to pedestrian counts. Crosswalks provide priority to pedestrians crossing at intersections, and sidewalks provide a separate right of way for pedestrians to walk safely next to a road (<xref rid="R253150932180204" ref-type="bibr">Lee et al., 2019</xref>; <xref rid="R253150932180195" ref-type="bibr">Lu et al., 2018</xref>). These expectations are met by the positive coefficients associated with the presence of a crosswalk or sidewalk in the NB regression model. Bus stops are also associated with greater pedestrian presence due to the access distance between the trip origin/destination and the transit stop (<xref rid="R253150932180193" ref-type="bibr">Hankey et al., 2012</xref>; <xref rid="R253150932180189" ref-type="bibr">Pulugurtha &amp; Repaka, 2008</xref>).</p>
          </list-item>
          <list-item id="li-6596ece61cef">
            <p><bold id="s-8f66b7ce4281">Land development.</bold> Denser, more varied use of land is expected to result in greater pedestrian counts due to convenience of the walking mode. Increases in parcel count, a measure of urban density, should indicate shorter distances to potential destinations, while land use mix increases suggest a greater variety of residential, commercial, and industrial uses within a small radius (<xref id="xref-f38dabf6ab0a44bbb26812fb6a1b9072" rid="R253150932180182" ref-type="bibr">Gayah et al., 2022</xref>). Walking becomes more convenient over shorter distances, and therefore more pedestrians are likely to be observed with greater parcel count and land use mix. Additionally, alcohol sales locations are frequently accessed via walking due to the dangers associated with driving under the influence (<xref id="xref-ae07062031744a74a2044cbed5e97c42" rid="R253150932180182" ref-type="bibr">Gayah et al., 2022</xref>).</p>
          </list-item>
          <list-item id="li-dda880edb39f">
            <p><bold id="s-2c12737fe1a1">Demographics.</bold> People who reported that they commute by non-motorized means are vastly more likely to be observed in a pedestrian count, and therefore a greater proportion of non-motorized commuters is expected to increase pedestrian counts, as observed by the positive coefficient in the NB regression model (<xref id="xref-81e17b0b8efd4ebc90277671c18ef1ae" rid="R253150932180200" ref-type="bibr">Griswold et al., 2019</xref>).</p>
          </list-item>
        </list>
      </sec>
      <sec>
        <title id="title-44a9eafd5c4b4527b4354d890e088386">MBRP model</title>
        <p id="paragraph-fb21a89965164439872cfeb42080fb58">Under the framework discussed in the methodology section, an MBRP model splitting over the natural logarithm of parcel count was developed. Due to the relatively small dataset, the maximum depth of the tree structure was limited to ensure that each of the sub-models was trained on a sufficiently large dataset. This also allowed for greater control over variable inclusion based on statistical significance and consistency with theory. The optimal split value of the parcel counts was found to be 71, with 1 197 of the training dataset observations registering parcel counts less than or equal to the optimal split value. <xref id="x-a15fc81e392d" rid="figure-0abe0f3afef04f118a4875d3ac587256" ref-type="fig">Figure 2</xref> depicts the tree structure for the MBRP model developed.</p>
        <fig id="figure-0abe0f3afef04f118a4875d3ac587256" orientation="portrait" fig-type="graphic" position="anchor">
          <label>Figure 2</label>
          <caption id="caption-991f5082857248be89202b0ccfae5907">
            <title id="title-edb1fd8ce7414dc9886e8cc629864c17">MBRP model tree structure</title>
          </caption>
          <graphic id="graphic-11d1eb645dce43a6a057d3f044ad0881" xlink:href="https://typeset-prod-media-server.s3.amazonaws.com/article_uploads/b4c20676-0003-47f6-98f8-f54dc3dd1e1b/image/5d5d5403-0dfe-4206-9618-dc821ba64874-ufigure-2.jpg"/>
        </fig>
        <p id="paragraph-4649823e595d4c62a435214b1182e627">In comparing the estimation results between the NB regression model and the MBRP model, land use mix was found to be statistically insignificant in the MBRP model and was therefore removed from the model. The indicator variables for crosswalks and bus stops were found to be insignificant in the higher urban density model of the MBRP model, though the coefficient for bus stops was consistent with theory, and the contribution from the crosswalk variable was minor enough to overlook given the magnitude of its contribution in the lower urban density model. Aside from these differences, the NB and MBRP model coefficients take the same signs and indicate the same relationships between explanatory variables and pedestrian count outcomes.</p>
        <p id="paragraph-0e99d0bff52845fc88823a0ae5e262a6">The MBRP model allows for additional interpretation of model coefficients between the sub-models, which captures the difference in relationships between the explanatory features and the pedestrian count outcome as they vary with urban density. For example, based on differences in the magnitudes of coefficients presented in the second and third columns of <xref id="x-f60f44705e4c" rid="table-wrap-cc7a640115ce47e2aaedc14182433222" ref-type="table">Table 4</xref>, we observe that pedestrian counts are more sensitive to the presence of alcohol sales locations in denser urban environments. On the other hand, pedestrians in denser urban environments are less sensitive to the presence of sidewalks, crosswalks, bus stops, and greater speed limits than their counterparts in less dense urban areas. Across all models, the coefficients estimated for the proportion of non-motorized commuters and the natural logarithm of AADT are approximately equal, which indicates that pedestrians everywhere are about as sensitive to both variables, regardless of urban density.</p>
      </sec>
      <sec>
        <title id="title-8a50965efc0c4eedbb70816761ac1184">Model comparison</title>
        <p id="paragraph-e19e762348e04f53b2ebf1f7e61742c5">Following model development, both models' cumulative residuals were evaluated over the testing dataset. The results were plotted on a CURE plot (<xref id="x-05f21611eb43" rid="figure-b44c76cfe24d4487bdbf91d55a611914" ref-type="fig">Figure 3</xref>) with the 95% confidence interval from the NB regression plotted to demonstrate how the MBRP model compares to the ‘baseline’ NB regression model. Overall, we can tell that both models are robust, plotting nearly all observations within the confidence interval. From the CURE plot, we see that for lower count values predicted, the cumulative residuals are about equal across both models. Both models appear to underpredict observations of approximately 200 pedestrians, though the residuals for the MBRP model are smaller. The trend of smaller residuals can be observed over most of the predicted range for the MBRP model, indicating a generally better fit for the data than the NB regression model.</p>
        <fig id="figure-b44c76cfe24d4487bdbf91d55a611914" orientation="portrait" fig-type="graphic" position="anchor">
          <label>Figure 3</label>
          <caption id="caption-52ecef7e618c446da4251d691b3a2bc1">
            <title id="title-1707f0f5e62f460a8f5ef1546f11d17e">Test data cumulative residual plots</title>
          </caption>
          <graphic id="graphic-dc5c8f3773524f35b7fae32608a5f31a" xlink:href="https://typeset-prod-media-server.s3.amazonaws.com/article_uploads/b4c20676-0003-47f6-98f8-f54dc3dd1e1b/image/0cadd133-2d2b-4b37-a9a8-7ec1a80b3a69-ufigure_3.png"/>
        </fig>
        <p id="paragraph-fb505c046c7d4b0490231d323de25e28">The models were also tested for goodness of fit by standard error measurements to determine how well the models predict the pedestrian counts relative to the observed pedestrian counts in the test dataset. <xref id="x-abb951646455" rid="table-wrap-a70dd15f02bd4a1f8d06ae14d0e05f98" ref-type="table">Table 5</xref> presents the goodness of fit statistics for both models, where the better performance measure is bolded. To better depict the differences between the models, the goodness of fit statistics are presented for arbitrarily determined low-, mid-, and high-count ranges, as well as over the entire test dataset. Due to the nature of MAPE and the presence of zero-count observations, MAPE could not be applied to the low-count range, nor the full test dataset. In other studies, MAPE has been applied to zero-count locations through either log-transformation or by adding a negligibly small value to zero-counts. In this case, neither adjustment was applied to avoid artificially inflating the percentage error of zero-counts, for which any predicted value other than zero would incur immense errors.</p>
        <table-wrap id="table-wrap-a70dd15f02bd4a1f8d06ae14d0e05f98" orientation="portrait">
          <label>Table 5</label>
          <caption id="caption-74162a76e35c4eecaec34949e83ffb9b">
            <title id="title-1c4798b2147f400b9d7c8245cdaad940">Goodness of fit statistics</title>
          </caption>
          <table id="table-a50fe366855f4defa7ede9351d63eb47" rules="rows">
            <colgroup>
              <col width="10.45"/>
              <col width="11.55"/>
              <col width="10.45"/>
              <col width="11.55"/>
              <col width="12.190000000000001"/>
              <col width="9.809999999999999"/>
              <col width="12.1"/>
              <col width="9.9"/>
              <col width="12"/>
            </colgroup>
            <thead id="table-section-header-36a0c954a638">
              <tr id="tr-a1281c7ed8c8">
                <th id="tc-d529f337e154" align="left">
                  <p id="p-b18f824af570"/>
                </th>
                <th id="tc-c09ea2a54450" colspan="2" align="center">
                  <p id="p-24c380435465">Low-Count (0–100)</p>
                  <p id="p-487686488005">(393 observations)</p>
                </th>
                <th id="tc-19c894df6cc9" colspan="2" align="center">
                  <p id="p-22349642843c">Mid-Count (101–1000)</p>
                  <p id="p-ec78f5ac5142">(82 observations)</p>
                </th>
                <th id="tc-f41cb818e6e6" colspan="2" align="center">
                  <p id="p-db4a864b2cc4">High-Count (1000+)</p>
                  <p id="p-413acb987553">(13 observations)</p>
                </th>
                <th id="tc-c783233da2f3" colspan="2" align="center">
                  <p id="p-88cf4c8668a5">Full Test Dataset</p>
                  <p id="p-43facab76cde">(488 observations)</p>
                </th>
              </tr>
            </thead>
            <tbody id="table-section-bdb3bd53747049b18b83fce0e254a467">
              <tr id="table-row-3464da4a85714f2980ddf08c6bb58bdc">
                <td id="table-cell-4d37c4a379c3" align="left">
                  <p id="paragraph-165f32d4f909"/>
                </td>
                <td id="table-cell-96250deeb17643e6a22291c424a01b0b" align="right">
                  <p id="paragraph-5362d75d85d243e0afacd600a74cd02c">NB</p>
                </td>
                <td id="table-cell-64b046ae35074f55bf1ea5965e71571f" align="right">
                  <p id="paragraph-4acaf2dde85541e5ac80e217b1ec5e2c">MBRP</p>
                </td>
                <td id="table-cell-1cc1b54d3a3a441485909ee70fdfffe7" align="right">
                  <p id="paragraph-74ace6a1733e499fa1b3b5609b77aacc">NB</p>
                </td>
                <td id="table-cell-a8343c13f75b44cda4e3e3d2ad22e397" align="right">
                  <p id="paragraph-ff6b4583f1734238aaafcc38528e204c">MBRP</p>
                </td>
                <td id="table-cell-2278b02bff56490093a304dedbe47a20" align="right">
                  <p id="paragraph-167af0d67df942e5849f923cce43558d">NB</p>
                </td>
                <td id="table-cell-a681fc78f1b24dcfb58e1ac185b89ac0" align="right">
                  <p id="paragraph-ee5429b4dd7f4951877fb802e4bca95c">MBRP</p>
                </td>
                <td id="table-cell-d4da298d5d84408689fb763732003764" align="right">
                  <p id="paragraph-488732f08c00488e950fd12e13ac5770"> NB</p>
                </td>
                <td id="table-cell-1f1a507a6ee24dbcbed012aef7eb9193" align="right">
                  <p id="paragraph-bba666f1d74d4565a8e4c69779cdcb0d"> MBRP</p>
                </td>
              </tr>
              <tr id="table-row-4274da474a96459aab3a3af9b3f55c0b">
                <td id="table-cell-a626a26cc7c04e1ebb870c24af9c68f7" align="left">
                  <p id="paragraph-6b237b8e845841549361aecfa476df68">MAE</p>
                </td>
                <td id="table-cell-11f4949f8cec41308b20fda0b54e2071" align="right">
                  <p id="paragraph-9d33fd82c7184d59a7232e94f3084b74"> 47.40</p>
                </td>
                <td id="table-cell-9f5bea7706a0456f91a163eeb89a9253" align="right">
                  <p id="paragraph-bdcc914ed4864507bd16bba13a1407ca"> <bold id="strong-838a7a46b41b4f60a11df17b845062fa">40.78</bold></p>
                </td>
                <td id="table-cell-5fd29ef0044f4d148a6e9d5d6d1112bd" align="right">
                  <p id="paragraph-54e07e51c2aa42fe903c0818733bc970"> 256.10</p>
                </td>
                <td id="table-cell-502fe20a342146fb9e5a265fcbc93b3f" align="right">
                  <p id="paragraph-5eb64a7b7ea740eb9c5d6edae9688ce5"> <bold id="strong-639985457f2d4aa2abd272c35d8ffaa0">245.99</bold></p>
                </td>
                <td id="table-cell-f50bc839f57949d7bfb573235206417e" align="right">
                  <p id="paragraph-91c1e8dc882f4326ae247c767ba43aef"> 2116.33</p>
                </td>
                <td id="table-cell-0f921851d45c4f8696f8cef2d6959441" align="right">
                  <p id="paragraph-85167b9f877b432ebeb78d8f9a153883"> <bold id="strong-84c1822755554bd58cb302864dd0657f">1964.48</bold></p>
                </td>
                <td id="table-cell-ad52a741cd864bef85309fb2581bed62" align="right">
                  <p id="paragraph-aed6f591f49b40cfb36ca89e8a46a60c"> 137.58</p>
                </td>
                <td id="table-cell-3cb568b0d8f246e898ee3b7a5d041d23" align="right">
                  <p id="paragraph-c4fa8adca42d4381b47a859651029cc5"> <bold id="strong-85cd1a3585294a8bae7b3237880bd9f3">126.51</bold></p>
                </td>
              </tr>
              <tr id="table-row-aec93545e0244a2c92bc72d839a41185">
                <td id="table-cell-e70a08663b844e33b1d9384af93fc6f1" align="left">
                  <p id="paragraph-41600fea3c3340109561bc7cf5669617">MAPE</p>
                </td>
                <td id="table-cell-205f667e604c497aac1f22344839520c" align="right">
                  <p id="paragraph-c5cd9a3cf28346c09a2ef8f638a20bff"> n/a</p>
                </td>
                <td id="table-cell-7937428a63c04fe2bb53e379be98725e" align="right">
                  <p id="paragraph-df1cbe83e7c54b429d085cb05a58242f"> n/a</p>
                </td>
                <td id="table-cell-aa9e3b2016914d3fa51d71ed92e32793" align="right">
                  <p id="paragraph-820033b9484649fb959e4631aa0091d9"> 118%</p>
                </td>
                <td id="table-cell-e0b298e1adf64c708e2f84fa2d3fbbbc" align="right">
                  <p id="paragraph-eb109444cff142238dbc78457799ed04"> <bold id="strong-7091eb0832d14512ac50ce015c8d448e">109%</bold></p>
                </td>
                <td id="table-cell-71713ed3c133428ea1388c60bfbfd711" align="right">
                  <p id="paragraph-c7bcf9fe03f442589e896df7e1614134"> 61%</p>
                </td>
                <td id="table-cell-bbb2d2b04f9d4bd29a828c17f0718af2" align="right">
                  <p id="paragraph-aff885812d7d4b9d9fa5d3a2a7f02143"> <bold id="strong-e98f876979174c99ab4be67c834a8860">55%</bold></p>
                </td>
                <td id="table-cell-a354a382e37e45deb5d92717539b2927" align="right">
                  <p id="paragraph-3f715a8690a04124838ea1846c9959e1"> n/a</p>
                </td>
                <td id="table-cell-aa6ab1c531af46cc88ece300e59e11ab" align="right">
                  <p id="paragraph-d1f9b54bca184e908bd12fe00475be5a"> n/a</p>
                </td>
              </tr>
              <tr id="table-row-a83b1e529d7c4efe9487d2c605f072e8">
                <td id="table-cell-406a950532ab4a62b17f02387b19789a" align="left">
                  <p id="paragraph-306aacc1acec487faeffbe9fd53e8a5e">RMSE</p>
                </td>
                <td id="table-cell-fdaf0f1640a046b28f760b9d5a6d72ba" align="right">
                  <p id="paragraph-e40f227e457e44d1a833e71e666a30c1"> 125.24</p>
                </td>
                <td id="table-cell-4ab0f2d8b4874a618c0fe9fba4826c21" align="right">
                  <p id="paragraph-897d5f1a25b54a659b4e025a04c062b5"> <bold id="strong-14f10e059b4441ccae7fea42724b61b9">97.49</bold></p>
                </td>
                <td id="table-cell-14a54580f7aa40c1901e283d25c4cd01" align="right">
                  <p id="paragraph-33700c8ff9cb4bbc97a75c7a92d95268"> <bold id="strong-d2f860e81ac54685acc5657364732871">409.42</bold></p>
                </td>
                <td id="table-cell-3df5756b59f048be83bc041e0d0532c4" align="right">
                  <p id="paragraph-edfd8d5b3fdc4c19ac55aaa0bb47cd2b"> 479.26</p>
                </td>
                <td id="table-cell-47f63b35da454a5d86c9a96681b1a423" align="right">
                  <p id="paragraph-8c7fbdc426334fadaec974f36dc4c6b1"> 3058.23</p>
                </td>
                <td id="table-cell-ab5e962670984e53992426ae535cd582" align="right">
                  <p id="paragraph-d5f3aef666aa48e5bf47f8895841c6bc"> <bold id="strong-57a5603be305432d9697b334269b8a21">2865.33</bold></p>
                </td>
                <td id="table-cell-b0d4942838e942ba9e09562465affbb4" align="right">
                  <p id="paragraph-73f0a5dee4324121a0c967838786e241"> 538.47</p>
                </td>
                <td id="table-cell-1ccab5d4dc4346abb2858cfd2f01c7f7" align="right">
                  <p id="paragraph-2881c94d17ce4b48a45fa098e3ef2b73"> <bold id="strong-5b252d462d3048d69377bb86d8af8075">514.75</bold></p>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn-group>
              <fn id="f-a795e88da306">
                <p id="p-eac709864225">Bolded values indicate best performing model.</p>
              </fn>
            </fn-group>
          </table-wrap-foot>
        </table-wrap>
        <p id="paragraph-1cd336831f3c4bf2b42134026491087c">Based on the AIC presented in <xref id="x-1768df719667" rid="table-wrap-cc7a640115ce47e2aaedc14182433222" ref-type="table">Table 4</xref>, we find that the MBRP model is an overall improvement over the traditional NB regression model. But the statistics presented in <xref id="x-ac19098733f7" rid="table-wrap-a70dd15f02bd4a1f8d06ae14d0e05f98" ref-type="table">Table 5</xref> allow for more distinct quantitative results. Over the whole test dataset, the MAE and RMSE both indicate that the MBRP model predicts more accurately than the NB regression model by about 8.0% and 4.4% respectively. This trend is consistently observed across the low- and high-count ranges, where MAE improves by 14.0% and 7.2%, respectively, and the RMSE is improved by 22.2% and 6.3%, respectively. The exception to the trend is in the mid-count range, where the MAE improves by 3.9%, but the RMSE increases by 17.1%. This anomaly can be attributed to a single predicted value with a large residual, which is then highly weighted in the RMSE calculation due to the squared component of the error statistic. The evaluation that the MBRP model outperforms the NB regression model even in the mid-count range is further supported by the 9.0 percentage-point improvement in the MAPE (from 118% to 109%); an improvement in the MAPE is also observed in the high-count range.</p>
        <p id="paragraph-2d0ff3cb538743d9a457c01ef8128fbc">Accounting for evidence provided by the AIC as found in model development, the CURE plots generated for both models, and the goodness of fit statistics as calculated over the test dataset, the MBRP model improves upon the traditional NB regression model in predicting pedestrian count values. Though the error evaluations differ in magnitude, trends in the MAE, RMSE, and MAPE indicate that using MBRP to model pedestrian count data can improve prediction accuracy by approximately 10% compared to traditional NB regression models.</p>
      </sec>
    </sec>
    <sec>
      <title id="t-17c1a536c1b5">Conclusions</title>
      <p id="paragraph-83b86de1fe274d9fbeb0ed76629d6a88">This study investigates a possible improvement in pedestrian exposure modeling, by augmenting traditional NB regression models with a tree-based machine learning component, the MBRP algorithm. It was hypothesized that the inclusion of the MBRP algorithm would not only improve predictive accuracy but would allow for additional interpretation of the relationships between explanatory variables and pedestrian exposure estimates which may differ contextually in ways that are not known a priori. Data from North Carolina is subdivided into training and test datasets. Training data is applied to develop a traditional NB regression model and an MBRP model, and the two models’ predictive performance is assessed based on the predictions for the test dataset.</p>
      <p id="paragraph-586e41b6f1434fdd836cccd60fc082c7">The use of the MBRP algorithm resulted in a model indicating that a pedestrian count’s relationship with explanatory variables varies with the natural logarithm of parcel count, which suggests that pedestrian counts in denser urban environments are more sensitive to the presence of alcohol sales locations, and less sensitive to the presence of sidewalks, crosswalks, bus stops, and roadways with higher speed limits. These trends are not observable through traditional NB models, which typically take more of a ‘one-size-fits-all’ approach that does not consider how the relationships between explanatory variables may vary with context.</p>
      <p id="paragraph-6248d336710a4fc692deb6568d1cfd28">The model developed using the MBRP algorithm improved predictions of pedestrian counts over the test dataset by approximately 10% as measured by MAE, MAPE, and RMSE. The model’s fitness was also shown to be an improvement over the NB regression model through a lower AIC and the MBRP model plotting more points within the confidence interval and nearer to zero on a CURE plot.</p>
      <p id="paragraph-0a344b1a792147a6b455de48be86569a">The proposed use of the MBRP algorithm to improve pedestrian exposure estimates overcomes the shortcomings of traditional NB regression methods by capturing relationships between explanatory variables in context. Fortunately, the methodology is quite transferable to other regions outside of North Carolina, given that the MBRP algorithm inherently contextualizes coefficient estimates and naturally defines its own optimal splitting points. However, given the difficulty of retaining statistically significant variables across sub-models in the MBRP model, it should be noted that the variables selected for the MBRP model presented in this paper may not be statistically significant in another region. Further optimization may be required for application elsewhere. The MBRP algorithm and other machine learning methods are also known to be ‘data hungry’, and therefore the predictive power of this model may be limited by the size of the available dataset. In practice, a larger dataset would yield better results and could allow for a deeper understanding of the relationships between explanatory variables, which may be more complex than the restricted model presented in this paper suggests.</p>
    </sec>
    <sec>
      <title id="t-1ca2a2a0d795">Funding</title>
      <p id="p-92c29ce6e801">No external funding was used in this research.</p>
    </sec>
    <sec>
      <title id="t-c42dfc6d6338">Declaration of generative AI use in writing</title>
      <p id="p-ed12a99fb2f9">During the preparation of this work the authors used GPT-4 to check writing for grammatical errors and improve clarity of language in the final manuscript. The outputs were reviewed and revised by the authors who take full responsibility for the content of the publication.</p>
    </sec>
    <sec>
      <title id="t-de1bc5b7a39b">Declaration of competing interests</title>
      <p id="p-d6e867a2d03e">The authors declare no competing interests.</p>
    </sec>
    <sec>
      <title id="t-022bd947b437">Ethics statement</title>
      <p id="p-d97bf5a1346f">The research performed in this paper does not qualify as human subjects research and thus does not require any IRB protocol.</p>
    </sec>
  </body>
  <back>
    <ack id="ack-8709dfda44da">
      <title id="ack-title-2508ebe928b6">Acknowledgements</title>
      <p id="paragraph-b897984a408b">The data used for this project comes from a previous project supported by the North Carolina Department of Transportation which evaluated systemic risk factors in pedestrian safety outcomes. The authors would like to thank Daniel Carter and Brian Mayhew of NCDOT for providing the data, and Ian Hamilton and Lauren Blackburn of VHB and Ilgin Guler of Penn State for their collaboration.</p>
      <p id="p-acadc092f24c">An earlier version of this work was presented at the 9<sup id="s-d7a7da299f3f">th</sup> Road Safety and Simulation conference, held in Lexington, KY, USA, on 28–31 October 2024.</p>
    </ack>
    <fn-group id="fn-group-a4928a201d334c739a7eaa0e5732af92"/>
    <ref-list>
      <title>References</title>
      <ref id="R253150932180186">
        <element-citation publication-type="research-report">
          <person-group person-group-type="author">
            <collab>NHTSA</collab>
          </person-group>
          <article-title>Traffic Safety Facts, 2021 Data: Pedestrians</article-title>
          <source>National Highway Traffic Safety Administration</source>
          <year>2023</year>
          <uri>https://crashstats.nhtsa.dot.gov/Api/Public/ViewPublication/813458</uri>
          <comment>DOT HS 813 458</comment>
        </element-citation>
      </ref>
      <ref id="R253150932180198">
        <element-citation publication-type="website">
          <person-group person-group-type="author">
            <collab>NHTSA</collab>
          </person-group>
          <article-title>FARS Encyclopedia 2023</article-title>
          <source>National Highway Traffic Safety Administration</source>
          <year>2023</year>
          <uri>https://www-fars.nhtsa.dot.gov/Main/index.aspx</uri>
        </element-citation>
      </ref>
      <ref id="R253150932180199">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Sener</surname>
              <given-names>I</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Emerging data for pedestrian and bicycle monitoring: sources and applications</article-title>
          <source>Transportation Research Interdisciplinary Perspectives</source>
          <year>2020</year>
          <volume>4</volume>
          <pub-id pub-id-type="doi">10.1016/j.trip.2020.100095</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180206">
        <element-citation publication-type="research-report">
          <person-group person-group-type="author">
            <name>
              <surname>Lagerwey</surname>
              <given-names>P A</given-names>
            </name>
            <name>
              <surname>Hintze</surname>
              <given-names>M J</given-names>
            </name>
            <name>
              <surname>Elliott</surname>
              <given-names>J B</given-names>
            </name>
            <name>
              <surname>Toole</surname>
              <given-names>J L</given-names>
            </name>
            <name>
              <surname>Schneider</surname>
              <given-names>R J</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Pedestrian and bicycle transportation along existing roads—ActiveTrans priority tool guidebook</article-title>
          <source>National Cooperative Highway Research Program</source>
          <year>2015</year>
          <pub-id pub-id-type="doi">10.17226/22163</pub-id>
          <comment>Report 803</comment>
        </element-citation>
      </ref>
      <ref id="R253150932180205">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Behnam</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Patel</surname>
              <given-names>B G</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Pedestrian volume estimation by land-use variables</article-title>
          <source>Transportation Engineering Journal of ASCE</source>
          <year>1977</year>
          <volume>103</volume>
          <issue>4</issue>
          <fpage>507</fpage>
          <lpage>520</lpage>
          <pub-id pub-id-type="doi">10.1061/TPEJAN.0000649</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180200">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Griswold</surname>
              <given-names>J B</given-names>
            </name>
            <name>
              <surname>Medury</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Schneider</surname>
              <given-names>R J</given-names>
            </name>
            <name>
              <surname>Amos</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Grembek</surname>
              <given-names>O</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>A pedestrian exposure model for the California State highway system</article-title>
          <source>Transportation Research Record</source>
          <year>2019</year>
          <volume>2673</volume>
          <issue>4</issue>
          <fpage>941</fpage>
          <lpage>950</lpage>
          <pub-id pub-id-type="doi">10.1177/0361198119837235</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180193">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hankey</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Lindsey</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Borah</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Hoff</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Utecht</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>Z</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Estimating use of non-motorized infrastructure: Models of bicycle and pedestrian traffic in Minneapolis, MN</article-title>
          <source>Landscape and Urban Planning</source>
          <year>2012</year>
          <volume>107</volume>
          <issue>3</issue>
          <fpage>307</fpage>
          <lpage>316</lpage>
          <pub-id pub-id-type="doi">10.1016/j.landurbplan.2012.06.005</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180197">
        <element-citation publication-type="website">
          <person-group person-group-type="author">
            <name>
              <surname>Haynes</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Andrzejewski</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Saghir</surname>
              <given-names>Chade</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>Li-yang</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>GIS based bicycle &amp; pedestrian demand forecasting techniques</article-title>
          <source>U.S. Department of Transportation</source>
          <year>2010</year>
          <uri>https://www.fhwa.dot.gov/planning/tmip/community/webinars/summaries/20100429/index.cfm</uri>
          <comment>TMIP webinar</comment>
        </element-citation>
      </ref>
      <ref id="R253150932180191">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lindsey</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Han</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Neighborhood correlates of urban trail use</article-title>
          <source>Journal of Physical Activity and Health</source>
          <year>2006</year>
          <volume>3</volume>
          <fpage>139</fpage>
          <lpage>157</lpage>
          <pub-id pub-id-type="doi">10.1123/jpah.3.s1.s139</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180187">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lindsey</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Rubchinskaya</surname>
              <given-names>E</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Han</surname>
              <given-names>Y</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Estimating urban trail traffic: Methods for existing and proposed trails</article-title>
          <source>Landscape and Urban Planning</source>
          <year>2007</year>
          <volume>81</volume>
          <issue>4</issue>
          <fpage>299</fpage>
          <lpage>315</lpage>
          <pub-id pub-id-type="doi">10.1016/j.landurbplan.2007.01.004</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180183">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Griswold</surname>
              <given-names>J</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Pedestrian volume modeling: A case study of San Francisco</article-title>
          <source>Yearbook of the Association of Pacific Coast Geographers</source>
          <year>2009</year>
          <volume>71</volume>
          <issue>1</issue>
          <fpage>164</fpage>
          <lpage>181</lpage>
          <pub-id pub-id-type="doi">10.1353/pcg.0.0030</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180194">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Miranda-Moreno</surname>
              <given-names>L F</given-names>
            </name>
            <name>
              <surname>Fernandes</surname>
              <given-names>D</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Modeling of pedestrian activity at signalized intersections: Land use, urban form, weather, and spatiotemporal patterns</article-title>
          <source>Transportation Research Record</source>
          <year>2011</year>
          <volume>2264</volume>
          <issue>1</issue>
          <fpage>74</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.3141/2264-09</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180189">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Pulugurtha</surname>
              <given-names>S S</given-names>
            </name>
            <name>
              <surname>Repaka</surname>
              <given-names>S R</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Assessment of models to measure pedestrian activity at signalized intersections</article-title>
          <source>Transportation Research Record</source>
          <year>2008</year>
          <volume>2073</volume>
          <issue>1</issue>
          <fpage>39</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.3141/2073-05</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180196">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Schneider</surname>
              <given-names>R J</given-names>
            </name>
            <name>
              <surname>Arnold</surname>
              <given-names>L S</given-names>
            </name>
            <name>
              <surname>Ragland</surname>
              <given-names>D R</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Pilot model for estimating pedestrian intersection crossing volumes</article-title>
          <source>Transportation Research Record</source>
          <year>2009</year>
          <volume>2140</volume>
          <issue>1</issue>
          <fpage>13</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.3141/2140-02</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180203">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Schneider</surname>
              <given-names>R J</given-names>
            </name>
            <name>
              <surname>Henry</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Mitman</surname>
              <given-names>M F</given-names>
            </name>
            <name>
              <surname>Stonehill</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Koehler</surname>
              <given-names>J</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Development and application of volume model for pedestrian intersections in San Francisco, California</article-title>
          <source>Transportation Research Record</source>
          <year>2012</year>
          <volume>2299</volume>
          <issue>1</issue>
          <fpage>65</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.3141/2299-08</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180204">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Abdel-Aty</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Shah</surname>
              <given-names>I</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Evaluation of surrogate measures for pedestrian trips at intersections and crash modeling</article-title>
          <source>Accident Analysis &amp; Prevention</source>
          <year>2019</year>
          <volume>130</volume>
          <fpage>91</fpage>
          <lpage>98</lpage>
          <pub-id pub-id-type="doi">10.1016/j.aap.2018.05.015</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180202">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hankey</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Lindsey</surname>
              <given-names>G</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Facility-demand models of peak period pedestrian and bicycle traffic: Comparison of fully specified and reduced-form models</article-title>
          <source>Transportation Research Record</source>
          <year>2016</year>
          <volume>2586</volume>
          <fpage>48</fpage>
          <lpage>58</lpage>
          <pub-id pub-id-type="doi">10.3141/2586-06</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180201">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hankey</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Mondschein</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Buehler</surname>
              <given-names>R</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Spatial models of active travel in small communities: Merging the goals of traffic monitoring and direct-demand modeling</article-title>
          <source>Journal of Transport &amp; Health</source>
          <year>2017</year>
          <volume>7</volume>
          <fpage>149</fpage>
          <lpage>159</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jth.2017.08.009</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180195">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Mondschein</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Buehler</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Hankey</surname>
              <given-names>S</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Adding temporal information to direct-demand models: Hourly estimation of bicycle and pedestrian traffic in Blacksburg, VA</article-title>
          <source>Transportation Research Part D: Transport and Environment</source>
          <year>2018</year>
          <volume>63</volume>
          <fpage>244</fpage>
          <lpage>260</lpage>
          <pub-id pub-id-type="doi">10.1016/j.trd.2018.05.011</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180184">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kashani</surname>
              <given-names>A T</given-names>
            </name>
            <name>
              <surname>Mohaymany</surname>
              <given-names>A S</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Analysis of the traffic injury severity on two-lane, two-way rural roads based on classification tree models</article-title>
          <source>Safety Science</source>
          <year>2011</year>
          <volume>49</volume>
          <issue>10</issue>
          <fpage>1314</fpage>
          <lpage>1320</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ssci.2011.04.019</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180185">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Seibold</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Zeileis</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Hothorn</surname>
              <given-names>T</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Model-based recursive partitioning for subgroup analyses</article-title>
          <source>The International Journal of Biostatistics</source>
          <year>2016</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>45</fpage>
          <lpage>63</lpage>
          <pub-id pub-id-type="doi">10.1515/ijb-2015-0032</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180181">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Donnell</surname>
              <given-names>E T</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Application of a model-based recursive partitioning algorithm to predict crash frequency</article-title>
          <source>Accident Analysis &amp; Prevention</source>
          <year>2019</year>
          <volume>132</volume>
          <fpage>105274</fpage>
          <pub-id pub-id-type="doi">10.1016/j.aap.2019.105274</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180207">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zeileis</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Hornik</surname>
              <given-names>K</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Generalized M-fluctuation tests for parameter instability</article-title>
          <source>Statistica Neerlandica</source>
          <year>2007</year>
          <volume>61</volume>
          <fpage>488</fpage>
          <lpage>508</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1467-9574.2007.00371.x</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180192">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zeileis</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Hothorn</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Hornik</surname>
              <given-names>K</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Model-based recursive partitioning</article-title>
          <source>Journal of Computational and Graphical Statistics</source>
          <year>2008</year>
          <volume>17</volume>
          <fpage>492</fpage>
          <lpage>514</lpage>
          <pub-id pub-id-type="doi">10.1198/106186008X319331</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180182">
        <element-citation publication-type="research-report">
          <person-group person-group-type="author">
            <name>
              <surname>Gayah</surname>
              <given-names>V V</given-names>
            </name>
            <name>
              <surname>Guler</surname>
              <given-names>S I</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Blackburn</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Hamilton</surname>
              <given-names>I</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Quantification of Systemic Risk Factors for Pedestrian Safety on North Carolina</article-title>
          <source>FHWA</source>
          <year>2022</year>
          <uri>https://connect.ncdot.gov/projects/research/Pages/ProjDetails.aspx?ProjectID=2022-11</uri>
          <comment>NCDOT Project 2022-11</comment>
        </element-citation>
      </ref>
      <ref id="R253150932180188">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Frank</surname>
              <given-names>L D</given-names>
            </name>
            <name>
              <surname>Andresen</surname>
              <given-names>M A</given-names>
            </name>
            <name>
              <surname>Schmid</surname>
              <given-names>T L</given-names>
            </name>
            <collab/>
          </person-group>
          <article-title>Obesity relationships with community design, physical activity, and time spent in cars</article-title>
          <source>American Journal of Preventive Medicine</source>
          <year>2004</year>
          <volume>27</volume>
          <issue>2</issue>
          <fpage>87</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amepre.2004.04.011</pub-id>
        </element-citation>
      </ref>
      <ref id="R253150932180190">
        <element-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Hauer</surname>
              <given-names>E</given-names>
            </name>
            <collab/>
          </person-group>
          <source>The Art of Regression Modeling in Road Safety</source>
          <publisher-name>Springer</publisher-name>
          <publisher-loc>New York</publisher-loc>
          <year>2015</year>
          <pub-id pub-id-type="doi">10.1007/978-3-319-12529-9</pub-id>
        </element-citation>
      </ref>
    </ref-list>
  </back>
</article>
