<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Sustain. Cities</journal-id>
<journal-title>Frontiers in Sustainable Cities</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Sustain. Cities</abbrev-journal-title>
<issn pub-type="epub">2624-9634</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frsc.2025.1649853</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Sustainable Cities</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Risk prediction of new energy vehicle based on dynamic-static feature fusion</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Zhang</surname> <given-names>Xiang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/3079593/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Yin</surname> <given-names>Xiaoxuan</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/3105742/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Huang</surname> <given-names>Shubing</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Ge</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/3105528/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Chongming</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Traffic Management Research Institute of the Ministry of Public Security</institution>, <addr-line>Wuxi</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>National Engineering Research Center for Electric Vehicles, Beijing Institute of Technology</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>The Center for E-Mobility and Clean Growth, Coventry University</institution>, <addr-line>Coventry</addr-line>, <country>United Kingdom</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Salvador Garc&#x000ED;a-Ayll&#x000F3;n Veintimilla, Polytechnic University of Cartagena, Spain</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Pendela Kanchanamala, GMR Institute of Technology, India</p>
<p>Bittu Ghosh, National Institute of Technology, Durgapur, India</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Xiang Zhang <email>zhangxiang&#x00040;tmri.cn</email></corresp>
<corresp id="c002">Xiaoxuan Yin <email>xiaoxuan_yin&#x00040;bit.edu.cn</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>25</day>
<month>08</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>7</volume>
<elocation-id>1649853</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>06</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>31</day>
<month>07</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2025 Zhang, Yin, Huang, Zhang and Wang.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Zhang, Yin, Huang, Zhang and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>To support the goals of low-carbon and sustainable development, new energy vehicles (NEVs) are being increasingly adopted. However, the frequency of traffic accidents involving NEVs also shows a rising trend. To address this challenge, this paper proposes an accident risk prediction method for new energy vehicles based on dynamic-static feature fusion. First, direct and indirect data strongly related to accident risk are extracted from the full-year accident data of a province in 2021, including environmental factors (weather and road type), dynamic operating data (speed), vehicle alarm status, and historical accident characteristics. Then, to quantify and capture the potential risk characteristics of the vehicle, LSTM layers are used to construct dynamic and static feature vectors representing vehicle accident risk. Moreover, the accident risk probability is calculated based on fully connected layers and the sigmoid activation function. Finally, the proposed accident risk prediction model is tested and validated with real accident data. The results show that the model achieves a prediction accuracy of 85% for new energy vehicle accidents, which is a 24% improvement over traditional models based on weather and road types. The model can provide timely warnings to drivers before accidents occur, helping them take necessary safety measures to reduce accident probability.</p></abstract>
<kwd-group>
<kwd>new energy vehicle</kwd>
<kwd>accident risk prediction</kwd>
<kwd>dynamic-static feature fusion</kwd>
<kwd>long short-term memory</kwd>
<kwd>traffic safety</kwd>
</kwd-group>
<counts>
<fig-count count="10"/>
<table-count count="6"/>
<equation-count count="23"/>
<ref-count count="46"/>
<page-count count="13"/>
<word-count count="8645"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Urban Transportation Systems and Mobility</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>1 Introduction</title>
<p>As a central force in the low-carbon transition of the transportation sector, New Energy Vehicles (NEVs) significantly reduce dependence on fossil fuels and greenhouse gas emissions by optimizing energy structures and minimizing lifecycle carbon footprints. NEVs have thus become a key component in building sustainable transportation systems globally. According to statistics from the Traffic Management Bureau of the Ministry of Public Security, the number of newly registered NEVs has surged from 1.2 million in 2019 to 7.43 million in 2023, reflecting a rapid-growth trend (<xref ref-type="bibr" rid="B25">Ministry of Public Security, 2024</xref>). However, frequent safety incidents during the large-scale deployment of NEVs, such as battery thermal runaway and fire caused by collisions, not only pose serious threats to public safety but may also undermine their environmental benefits in several ways (<xref ref-type="bibr" rid="B46">Zhao et al., 2025</xref>). On one hand, accidents can lead to vehicle damage, battery pollution, and secondary environmental risks, directly reducing carbon reduction gains. On the other hand, the resulting traffic congestion, emergency resource usage, and decline in public trust may indirectly hinder NEV market adoption and infrastructure development, limiting the overall progress toward a sustainable road transport system. In response, researchers have carried out extensive studies and proposed various solutions to reduce both the frequency and severity of accidents. Among these efforts, accident risk prediction models have attracted considerable attention due to their potential to provide early warnings and significantly decrease the likelihood of traffic incidents.</p>
<p>Traffic accident risk prediction models seek to prevent accidents by gaining a deep understanding of the factors that contribute to their occurrence and by predicting the corresponding risk levels. These models typically rely on techniques such as data-driven analysis (<xref ref-type="bibr" rid="B22">Lin et al., 2015</xref>; <xref ref-type="bibr" rid="B3">Aung et al., 2018</xref>; <xref ref-type="bibr" rid="B2">Ardakani et al., 2023</xref>), machine learning (<xref ref-type="bibr" rid="B45">Zhao et al., 2019</xref>; <xref ref-type="bibr" rid="B6">Br&#x000FC;hwiler et al., 2022</xref>; <xref ref-type="bibr" rid="B20">Li and Yu, 2025</xref>; <xref ref-type="bibr" rid="B19">Li and Chen, 2025</xref>; <xref ref-type="bibr" rid="B43">Zhang et al., 2022</xref>; <xref ref-type="bibr" rid="B12">Ghasedi et al., 2021</xref>; <xref ref-type="bibr" rid="B5">Berhanu et al., 2023</xref>; <xref ref-type="bibr" rid="B32">Santos et al., 2021</xref>; <xref ref-type="bibr" rid="B29">Prajapati et al., 2023</xref>; <xref ref-type="bibr" rid="B1">Ahmed et al., 2023</xref>), neural networks (<xref ref-type="bibr" rid="B21">Lin et al., 2021</xref>; <xref ref-type="bibr" rid="B33">Shaik et al., 2021</xref>; <xref ref-type="bibr" rid="B26">Najafi Moghaddam Gilani et al., 2021</xref>; <xref ref-type="bibr" rid="B42">Yu et al., 2021</xref>; <xref ref-type="bibr" rid="B8">Chakraborty et al., 2019</xref>; <xref ref-type="bibr" rid="B13">Ghosh and Karmakar, 2025</xref>; <xref ref-type="bibr" rid="B17">Kaffash Charandabi et al., 2022</xref>; <xref ref-type="bibr" rid="B36">Wang et al., 2021</xref>), and deep learning (<xref ref-type="bibr" rid="B30">Ren et al., 2018</xref>; <xref ref-type="bibr" rid="B4">Basso et al., 2021</xref>; <xref ref-type="bibr" rid="B35">Sun et al., 2024</xref>) to capture complex patterns in traffic data and assess the likelihood of accidents under various conditions. <xref ref-type="bibr" rid="B22">Lin et al. (2015)</xref> proposed a novel variable selection method based on the Frequent Pattern Tree algorithm, which was integrated with the k-nearest neighbors model and Bayesian network to enable real-time traffic accident risk prediction. <xref ref-type="bibr" rid="B3">Aung et al. (2018)</xref> introduced an accident prediction algorithm tailored for urban environments. By incorporating variables such as vehicle speed, weather conditions, and driver fatigue, the model employed a Hidden Markov Model (HMM) to establish correlations between observed data and potential accident risks. <xref ref-type="bibr" rid="B28">Park and Hong (2022)</xref> proposed a deep learning-based accident risk prediction model that integrates both static and dynamic road features, to accurately assess the risk of accident occurrence under varying road and environmental conditions. <xref ref-type="bibr" rid="B44">Zhao et al. (2022)</xref> presented an accident risk prediction approach that combines deep convolutional neural networks (CNN) with a random forest classifier. The CNN was used to extract key features from the data, while the random forest comprising multiple decision trees was used to output the associated risk of a traffic accident.</p>
<p>Considering accident-related factors is crucial for improving the accuracy of traffic accident risk prediction. However, the causes of traffic accidents are complex and diverse, increasing the difficulty of accident risk prediction. Existing research has extensively explored the impact of vehicle factors and external environmental factors on traffic risks (<xref ref-type="bibr" rid="B41">Yannis et al., 2017</xref>; <xref ref-type="bibr" rid="B31">Roland et al., 2021</xref>; <xref ref-type="bibr" rid="B12">Ghasedi et al., 2021</xref>). Vehicle factors primarily refer to the operating state of the vehicle during driver operation, including vehicle spacing, steering angle changes, lateral acceleration, and yaw rate (<xref ref-type="bibr" rid="B10">Enache et al., 2009</xref>; <xref ref-type="bibr" rid="B27">Ning et al., 2009</xref>). Studies have shown that the vehicle&#x00027;s operating state can indirectly reflect the driver&#x00027;s condition after excluding driver skill differences. Based on this fundamental characteristic, some researchers have analyzed driving behavior or driving risks using vehicle operation state data (<xref ref-type="bibr" rid="B24">Mantouka et al., 2019</xref>). For example, <xref ref-type="bibr" rid="B37">Wang et al. (2011)</xref> considered factors such as speed and acceleration to establish a risk assessment model. <xref ref-type="bibr" rid="B23">Mandal et al. (2016)</xref> used time-series measurements of driving behavior and a particle swarm-optimized artificial neural network algorithm to classify driver states and assess driving risk. 
Research shows that the external environment, including weather and road conditions, significantly affects driving safety (<xref ref-type="bibr" rid="B11">Feng et al., 2010</xref>; <xref ref-type="bibr" rid="B15">Hassan and Abdel-Aty, 2011</xref>; <xref ref-type="bibr" rid="B38">Xiao et al., 2000</xref>; <xref ref-type="bibr" rid="B18">Koramati et al., 2022</xref>; <xref ref-type="bibr" rid="B14">Hao et al., 2015</xref>; <xref ref-type="bibr" rid="B40">Xu X. L., 2013</xref>; <xref ref-type="bibr" rid="B7">Casner et al., 2016</xref>). For example, <xref ref-type="bibr" rid="B39">Xu C. C. (2013)</xref> established an accident risk model for adverse weather using real-time data and logistic regression models, finding that the impact of rain on risk is greater than that of fog. <xref ref-type="bibr" rid="B9">Chen et al. (2009)</xref> quantitatively analyzed the impact of road type, specifications, alignment, sight distance, and pavement condition on accident rates based on Bayesian theory. The study found that under the same traffic flow, the accident rate decreases with the improvement of road specifications.</p>
<p>The studies mentioned above mainly analyze the independent impact of individual factors (such as driving conditions, vehicle speed, acceleration, and external environmental factors like adverse weather and road conditions) on traffic accidents and driving safety. However, they seldom consider the dynamic association between vehicle factors and external environmental factors, or the coupling effects between different factors on traffic risk. Therefore, how to effectively integrate vehicle factors and external environmental factors to achieve multi-source data fusion and accurately predict risks is a significant challenge in the field of traffic safety.</p>
<p>To address the above problems, this paper proposes an accident risk prediction model for new energy vehicles based on dynamic-static feature fusion. Key feature parameters strongly correlated with accident risk are extracted by analyzing the impact of accident risk factors on the risk of NEV accidents. Based on this, the LSTM algorithm is employed to establish a mapping relationship from dynamic-static feature parameters to NEV accident risk, enabling accurate prediction of NEV accidents. The main innovations are as follows:</p>
<list list-type="simple">
<list-item><p>(1) Relying on vehicle status data and external environmental data from national regulatory platforms, a novel accident risk prediction model is proposed based on the dynamic-static feature fusion, accurately predicting the occurrence of accidents.</p></list-item>
<list-item><p>(2) A mapping is established between dynamic-static feature parameters and NEV accident risk based on the LSTM algorithm. This approach accurately captures dynamic and static risk patterns in time-series data, offers new insights into risk assessment for driving safety, and provides reliable data support for accident prevention.</p></list-item>
</list>
</sec>
<sec id="s2">
<title>2 Introduction to accident risk factors</title>
<p>The selection of key influencing factors for new energy vehicle accidents is fundamental to establishing an accurate accident risk prediction model. To improve the prediction accuracy of the accident risk model, this paper extracts direct and indirect information data related to NEV accidents from a full year of accident records in a specific province in 2021. The direct information data includes the time, location, involved vehicles, and causes of the accidents. The indirect information data primarily includes road features and weather conditions.</p>
<sec>
<title>2.1 Weather conditions</title>
<p>Weather conditions play a critical role in driving safety. Adverse weather such as rain or snow can lead to slippery road surfaces, increasing braking distances and significantly elevating the likelihood of traffic accidents. Moreover, under low-visibility conditions such as fog or haze, the limited visual perception of the drivers further amplifies the risk of collisions. Although the overall accident rate under clear weather is relatively low, the probability of severe accidents tends to be higher due to higher driving speeds. Therefore, taking weather conditions as an input variable in predictive models can help identify risks induced by environmental factors.</p>
<p>To achieve accurate prediction of accident severity, the weather conditions are categorized into 19 distinct types, as shown in <xref ref-type="table" rid="T1">Table 1</xref>. However, considering that some weather types occur infrequently and to simplify the modeling process, these categories were consolidated into five broader groups: sunny, overcast, snowy, rainy, and foggy.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Weather conditions.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Index</bold></th>
<th valign="top" align="left"><bold>Weather type</bold></th>
<th valign="top" align="center"><bold>Index</bold></th>
<th valign="top" align="left"><bold>Weather type</bold></th>
<th valign="top" align="center"><bold>Index</bold></th>
<th valign="top" align="left"><bold>Weather type</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">Sunny</td>
<td valign="top" align="center">8</td>
<td valign="top" align="left">Light snow</td>
<td valign="top" align="center">15</td>
<td valign="top" align="left">Blizzard</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">Overcast</td>
<td valign="top" align="center">9</td>
<td valign="top" align="left">Moderate snow</td>
<td valign="top" align="center">16</td>
<td valign="top" align="left">Sandstorm</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">Cloudy</td>
<td valign="top" align="center">10</td>
<td valign="top" align="left">Heavy snow</td>
<td valign="top" align="center">17</td>
<td valign="top" align="left">Torrential rain</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">Sleet</td>
<td valign="top" align="center">11</td>
<td valign="top" align="left">Fog</td>
<td valign="top" align="center">18</td>
<td valign="top" align="left">Haze</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="left">Light rain</td>
<td valign="top" align="center">12</td>
<td valign="top" align="left">Heavy rain</td>
<td valign="top" align="center">19</td>
<td valign="top" align="left">Dust</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left">Moderate rain</td>
<td valign="top" align="center">13</td>
<td valign="top" align="left">Thunderstorm</td>
<td/>
<td/>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="left">Showers</td>
<td valign="top" align="center">14</td>
<td valign="top" align="left">Snow showers</td>
<td/>
<td/>
</tr></tbody>
</table>
</table-wrap>
<p>As shown in <xref ref-type="fig" rid="F1">Figure 1</xref>, the majority of traffic accidents occur under sunny weather conditions, accounting for 85.53% of the total. This is followed by overcast (8.31%) and rainy (4.85%) conditions. Snowy weather accounts for the smallest proportion, with only 0.6% of total accidents. The high number of accidents under sunny weather conditions is primarily attributed to their high frequency throughout the year.</p>
<fig position="float" id="F1">
<label>Figure 1</label>
<caption><p>The distribution of traffic accidents under different weather conditions in a province in 2021.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0001.tif">
<alt-text>Pie chart showing the proportion of traffic accidents by weather condition in a province in 2021. Sunny conditions account for about 86%, overcast 8%, rainy 5%, and foggy and snowy each less than 1%.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<title>2.2 Road types</title>
<p>Road type significantly influences the risk of accidents by interacting with vehicle speed and traffic complexity. This paper divides road types into ten categories, as shown in <xref ref-type="table" rid="T2">Table 2</xref>. It also presents the distribution of accidents across different road types in 2021, as shown in <xref ref-type="fig" rid="F2">Figure 2</xref>. On highways, the higher driving speeds lead to an increased accident rate. Although vehicles on urban roads travel at lower speeds, they are more likely to be disrupted by factors such as pedestrians, non-motorized vehicles, and traffic signals, significantly increasing the probability of low-speed collisions. On rural roads, the lack of comprehensive traffic infrastructure, sharp turns, and complex road conditions greatly increase the risk of accidents. Therefore, the road type significantly influences accident risk.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Road types.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Road type code</bold></th>
<th valign="top" align="left"><bold>Description</bold></th>
<th valign="top" align="center"><bold>Road type code</bold></th>
<th valign="top" align="left"><bold>Description</bold></th>
<th valign="top" align="center"><bold>Road type code</bold></th>
<th valign="top" align="left"><bold>Description</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">Expressway</td>
<td valign="top" align="center">5</td>
<td valign="top" align="left">Rural road</td>
<td valign="top" align="center">9</td>
<td valign="top" align="left">Urban branch road</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">National road</td>
<td valign="top" align="center">6</td>
<td valign="top" align="left">Urban expressway</td>
<td valign="top" align="center">10</td>
<td valign="top" align="left">Other roads</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">Provincial road</td>
<td valign="top" align="center">7</td>
<td valign="top" align="left">Urban arterial road</td>
<td/>
<td/>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">County road</td>
<td valign="top" align="center">8</td>
<td valign="top" align="left">Urban secondary road</td>
<td/>
<td/>
</tr></tbody>
</table>
</table-wrap>
<fig position="float" id="F2">
<label>Figure 2</label>
<caption><p>The number of traffic accidents across different road types in a province in 2021.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0002.tif">
<alt-text>Bar chart showing the number of traffic accidents by road type in a province in 2021. Urban secondary roads have the highest accident count, followed by rural roads and urban branch roads. Expressways and urban expressways have the lowest counts.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<title>2.3 Vehicle speed</title>
<p>Vehicle speed is a direct factor influencing both the accident occurrence rate and severity. Higher speeds not only increase braking response time but also reduce the driver&#x00027;s ability to react to sudden situations, sharply increasing the probability of accidents. Additionally, continuous speed data can help analyze driving behavior and traffic flow. Real-time monitoring of vehicle speed allows for the timely identification of abnormal behaviors such as sudden acceleration and hard braking, which are significant factors contributing to accidents. Therefore, incorporating vehicle speed as a time-series input feature in the model helps accurately predict the occurrence of accidents. Additionally, the distribution of traffic accidents by speed in 2021 is recorded (as shown in <xref ref-type="fig" rid="F3">Figure 3</xref>) and used for feature contribution assessment.</p>
<fig position="float" id="F3">
<label>Figure 3</label>
<caption><p>The histogram of traffic accidents by vehicle speed in a province in 2021.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0003.tif">
<alt-text>Histogram of traffic accidents by vehicle speed in a province in 2021. The x-axis represents vehicle speed intervals, and the y-axis represents the number of accidents. Higher accident frequencies are observed at lower speeds, peaking around 20 to 30 kilometers per hour.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<title>2.4 Vehicle alarm information</title>
<p>The alarm information of new energy vehicles effectively reflects the vehicle&#x00027;s internal status and potential faults. Alarms for high battery temperature, undervoltage, or overvoltage may lead to vehicle loss of control, which is particularly dangerous at high speeds. Alarms related to driving motor anomalies and motor controller failures may cause stalling or loss of control, increasing the risk of accidents. Brake system alarms often accompany reduced braking performance, raising the likelihood of collisions. Therefore, incorporating alarm information as an important variable in the model helps capture potential fault risks in the vehicle. There are 19 types of alarm statuses for new energy vehicle accidents, as detailed in <xref ref-type="table" rid="T3">Table 3</xref>.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>New energy vehicle fault alarm codes.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Alarm code</bold></th>
<th valign="top" align="left"><bold>Status description</bold></th>
<th valign="top" align="center"><bold>Alarm code</bold></th>
<th valign="top" align="left"><bold>Status description</bold></th>
<th valign="top" align="center"><bold>Alarm code</bold></th>
<th valign="top" align="left"><bold>Status description</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">0</td>
<td valign="top" align="left">No fault</td>
<td valign="top" align="center">7</td>
<td valign="top" align="left">DC-DC temperature alarm</td>
<td valign="top" align="center">14</td>
<td valign="top" align="left">Single battery overvoltage alarm</td>
</tr>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">Overcharge of energy storage device</td>
<td valign="top" align="center">8</td>
<td valign="top" align="left">Insulation alarm</td>
<td valign="top" align="center">15</td>
<td valign="top" align="left">Low SOC alarm</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">Drive motor temperature alarm</td>
<td valign="top" align="center">9</td>
<td valign="top" align="left">Power battery consistency difference alarm</td>
<td valign="top" align="center">16</td>
<td valign="top" align="left">Energy storage device undervoltage alarm</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">High-voltage interlock alarm</td>
<td valign="top" align="center">10</td>
<td valign="top" align="left">Rechargeable energy storage system mismatch alarm</td>
<td valign="top" align="center">17</td>
<td valign="top" align="left">Energy storage device overvoltage alarm</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">Drive motor controller temperature alarm</td>
<td valign="top" align="center">11</td>
<td valign="top" align="left">SOC jump alarm</td>
<td valign="top" align="center">18</td>
<td valign="top" align="left">Battery high-temperature alarm</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="left">DC-DC status alarm</td>
<td valign="top" align="center">12</td>
<td valign="top" align="left">High SOC alarm</td>
<td valign="top" align="center">19</td>
<td valign="top" align="left">Temperature difference alarm</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left">Brake system alarm</td>
<td valign="top" align="center">13</td>
<td valign="top" align="left">Single battery undervoltage alarm</td>
<td/>
<td/>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>2.5 Vehicle history accident information</title>
<p>Historical accident information is a key variable in constructing an accident prediction model and holds significant value for analyzing the risk of accidents under different conditions. This paper extracts historical accident information from two aspects: accident type and accident frequency, to enhance the model&#x00027;s ability to predict future accident types and occurrence probabilities.</p>
<p>Accident types typically include five categories: scratching, collision, running over, rollover, and battery fire/explosion. Each type of accident has its specific causes and characteristics. Analyzing different accident types can reveal their risk tendencies under specific driving conditions. For example, collisions are more common on highways, while rollovers are more likely to occur on sharp turns or slippery road sections. Taking historical accident types as input variables helps the model accurately identify accident patterns, to optimize the prediction results.</p>
<p>Moreover, accident frequency is a key indicator for assessing accident likelihood. By analyzing the historical occurrence of specific accident types, the potential high-risk areas and contributing factors can be identified. Integrating accident frequency into the model enhances the accuracy of hotspot detection and improves overall prediction performance.</p>
<p>Based on the above analysis about accident-related factors, this paper selects environmental factors (weather and road type), dynamic operating data (speed), vehicle alarm status, and historical accident features as the model inputs. Environmental factors reflect external driving conditions, while dynamic operating data describes the vehicle&#x00027;s real-time operating status. Vehicle alarm status reveals potential technical faults, and historical accident features can reflect the vehicle&#x00027;s accident tendencies. By integrating these features, the models can capture multi-dimensional information affecting accident occurrence, leading to more accurate risk prediction.</p>
</sec>
<sec>
<title>2.6 Feature contribution assessment</title>
<p>To quantitatively assess the contribution of different accident features to traffic accidents, the XGBoost model is employed to analyze feature importance. Specifically, the Weight method is applied to measure how frequently each feature <italic>f</italic><sub><italic>i</italic></sub> appears as a split node, which serves as an indicator of its importance. The calculation formula is as follows:</p>
<disp-formula id="E1"><label>(1)</label><mml:math id="M1"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>W</mml:mi><mml:mi>e</mml:mi><mml:mi>i</mml:mi><mml:mi>g</mml:mi><mml:mi>h</mml:mi><mml:msub><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>n</mml:mi><mml:mi>t</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>f</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mtext>&#x000A0;</mml:mtext><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mtext>&#x000A0;</mml:mtext><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>e</mml:mi><mml:mtext>&#x000A0;</mml:mtext><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>T</italic> is the total number of trees, and <italic>count</italic>(<italic>f</italic><sub><italic>i</italic></sub> <italic>in tree t</italic>) represents the number of times feature <italic>f</italic><sub><italic>i</italic></sub> is used to split a node in tree <italic>t</italic>.</p>
<p>As shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, real-time vehicle speed and vehicle alarm information are the most influential predictors, indicating that dynamic driving behavior and real-time vehicle diagnostics play a critical role in accident occurrence. Historical accident frequency ranks next, as it reflects the unresolved high-risk factors in specific temporal and spatial contexts. Road type and weather conditions have a moderate impact, suggesting that the infrastructure and environmental factors can influence accident risk. Because they lack a direct correlation with real-time risk factors, historical accident types have the weakest effect. Overall, these findings help clarify the relative importance of accident-related features and provide a basis for selecting input parameters in accident risk prediction.</p>
<fig position="float" id="F4">
<label>Figure 4</label>
<caption><p>Feature importance ranking of accident predictors from XGBoost modeling.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0004.tif">
<alt-text>Bar chart showing feature importance with six features. Real-time vehicle speed has the highest importance score, followed by vehicle alarm information, historical accident frequency, road type, weather condition, and historical accident types. Scores range from zero to over three hundred fifty.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="s3">
<title>3 Method</title>
<p>This study proposes a prediction model for new energy vehicle accident risk based on Long Short-Term Memory (LSTM) networks. The model inputs include time-series data (such as weather, road conditions, vehicle speed) and static accident history features (such as vehicle historical accident types). The model output is the accident risk probability, which reflects the likelihood of a vehicle experiencing an accident within a certain future period. The model utilizes LSTM layers to process time-series features and fully connected layers to handle static features, capturing complex temporal dependencies and long-term trends during vehicle operation.</p>
<sec>
<title>3.1 Introduction to LSTM</title>
<p>Long Short-Term Memory (LSTM) networks are a type of recurrent neural network (RNN) architecture designed for time-series data. They are capable of remembering both long-term and short-term information, addressing the problem of traditional RNNs being unable to capture long-term dependencies in sequences (<xref ref-type="bibr" rid="B16">Hochreiter and Schmidhuber, 1997</xref>). The structure of the LSTM network unit is shown in <xref ref-type="fig" rid="F5">Figure 5</xref>.</p>
<fig position="float" id="F5">
<label>Figure 5</label>
<caption><p>Schematic diagram of the LSTM network unit structure.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0005.tif">
<alt-text>Diagram of an LSTM cell, showing the flow of information. Inputs include Ct-1, Ht-1, and It. Key components are forget gate ft, input gate it, and output gate ot. Operations involve multiplication, addition, and activation functions (&#x003C3;, tanh). Outputs are Ct and Ht.</alt-text>
</graphic>
</fig>
<p>The LSTM network consists of multiple identical units, each containing four key components: the input gate, forget gate, output gate, and cell state. The input gate controls which information is added to the cell state, the forget gate determines which information is discarded, and the output gate regulates the contribution of the cell state to the output. The cell state serves as the memory component, storing long-term dependencies. Each gate is governed by the following equations:</p>
<disp-formula id="E2"><label>(2)</label><mml:math id="M2"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>g</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>W</mml:mi><mml:mi>x</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>b</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>Where &#x003C3; is the sigmoid function; <italic>x</italic> is the input; <italic>W</italic> is the weight matrix; and <italic>b</italic> represents the bias term.</p>
<p>The sigmoid function maps the raw values to a range between 0 and 1, enabling it to effectively control the flow of information. Each LSTM network unit has a corresponding memory cell at each time step, whose responsibility is to retain information from the past sequence. LSTM can adjust the amount of information passed at each time step through the gating mechanism, to effectively update the current memory cell state. This ensures that the model can maintain long-term dependencies while avoiding problems of vanishing or exploding gradients.</p>
<p>Let the input sequence be (<italic>x</italic><sub>1</sub>, <italic>x</italic><sub>2</sub>, &#x022EF;&#x02009;, <italic>x</italic><sub><italic>T</italic></sub>) and the hidden state sequence be (<italic>h</italic><sub>1</sub>, <italic>h</italic><sub>2</sub>, &#x022EF;&#x02009;, <italic>h</italic><sub><italic>T</italic></sub>). The processing steps for an LSTM network unit at time step <italic>t</italic> are as follows:</p>
<list list-type="simple">
<list-item><p>(1) Data Input: The forget gate computes the output <italic>f</italic><sub><italic>t</italic></sub> by using the hidden state output from the previous time step <italic>h</italic><sub><italic>t</italic>&#x02212;1</sub> and the current input <italic>x</italic><sub><italic>t</italic></sub> to manage the degree of information retention. The calculation formula for <italic>f</italic><sub><italic>t</italic></sub> is as follows:
<disp-formula id="E3"><label>(3)</label><mml:math id="M3"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>f</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="true">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>f</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>b</mml:mi></mml:mrow><mml:mrow><mml:mi>f</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p></list-item>
<list-item><p>(2) Memory Selection: First, <italic>h</italic><sub><italic>t</italic>&#x02212;1</sub> and <italic>x</italic><sub><italic>t</italic></sub> are passed through the input gate to determine the information that needs to be updated, denoted as <italic>i</italic><sub><italic>t</italic></sub>. Then, <italic>h</italic><sub><italic>t</italic>&#x02212;1</sub> and <italic>x</italic><sub><italic>t</italic></sub> are processed through the tanh function to obtain the candidate memory state <inline-formula><mml:math id="M4"><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>C</mml:mi></mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>. Finally, the memory cell is updated. Here, <italic>f</italic><sub><italic>t</italic></sub><italic>C</italic><sub><italic>t</italic>&#x02212;1</sub> represents the information to be forgotten, while <inline-formula><mml:math id="M5"><mml:msub><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>C</mml:mi></mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> represents the new candidate memory state. The sum of these two gives <italic>C</italic><sub><italic>t</italic></sub>, which is the memory state at time step <italic>t</italic>. The calculation formulas are as follows:
<disp-formula id="E4"><label>(4)</label><mml:math id="M6"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>C</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>f</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mi>C</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>C</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mover></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<disp-formula id="E5"><label>(5)</label><mml:math id="M7"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="true">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>b</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<disp-formula id="E6"><label>(6)</label><mml:math id="M8"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>C</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mover><mml:mo>=</mml:mo><mml:mo class="qopname">tanh</mml:mo><mml:mrow><mml:mo stretchy="true">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>b</mml:mi></mml:mrow><mml:mrow><mml:mi>c</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p></list-item>
<list-item><p>(3) Data Output: Similar to the forget gate, the output gate computes the result by using <italic>h</italic><sub><italic>t</italic>&#x02212;1</sub> and <italic>x</italic><sub><italic>t</italic></sub> to obtain <italic>O</italic><sub><italic>t</italic></sub>. However, <italic>O</italic><sub><italic>t</italic></sub> is multiplied by the tanh function applied to the current memory state <italic>C</italic><sub><italic>t</italic></sub> to produce the current hidden state <italic>h</italic><sub><italic>t</italic></sub>.
<disp-formula id="E7"><label>(7)</label><mml:math id="M9"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>O</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>b</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<disp-formula id="E8"><label>(8)</label><mml:math id="M10"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>O</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo class="qopname">tanh</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>C</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p>
<p>Where <italic>W</italic><sub><italic>f</italic></sub>, <italic>W</italic><sub><italic>i</italic></sub>, <italic>W</italic><sub><italic>c</italic></sub>, <italic>W</italic><sub><italic>o</italic></sub> represent the weight matrices, and <italic>b</italic><sub><italic>f</italic></sub>, <italic>b</italic><sub><italic>i</italic></sub>, <italic>b</italic><sub><italic>c</italic></sub>, <italic>b</italic><sub><italic>o</italic></sub> represent the bias terms. &#x003C3; represents the sigmoid activation function.</p></list-item>
</list>
</sec>
<sec>
<title>3.2 Overall model structure</title>
<p>The structure of the new energy vehicle accident risk prediction model based on dynamic-static feature fusion is shown in <xref ref-type="fig" rid="F7">Figure 7</xref>. The model mainly consists of the LSTM layer, a fully connected layer for static features, a fusion layer, and an output layer. First, the model processes the time-series inputs, such as vehicle speed, alarm information, and road type, through the LSTM layer to extract temporal dependency features. The LSTM layer processes the input data step by step using a multi-unit structure, to learn the dynamic patterns during the vehicle&#x00027;s operation. Meanwhile, static features, such as historical accident frequency and severity, are processed through an independent fully connected (Dense) layer, generating a fixed feature vector to quantify and capture the vehicle&#x00027;s potential accident risk characteristics. Subsequently, the dynamic features extracted from the LSTM layer and the static feature representation are fused at each time step, forming a joint vector containing both temporal and static features. This joint vector is then input into a multi-layer fully connected network, and the sigmoid activation function generates the risk probability of a future accident occurring for the vehicle.
The formal definition of the network structure is as follows: The time-series input <inline-formula><mml:math id="M11"><mml:msub><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>e</mml:mi><mml:mi>q</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>&#x000D7;</mml:mo><mml:mi>F</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula> is processed through the LSTM layer to obtain a hidden state vector <inline-formula><mml:math id="M12"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>L</mml:mi><mml:mi>S</mml:mi><mml:mi>T</mml:mi><mml:mi>M</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula></p>
<disp-formula id="E9"><label>(9)</label><mml:math id="M13"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>L</mml:mi><mml:mi>S</mml:mi><mml:mi>T</mml:mi><mml:mi>M</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>L</mml:mi><mml:mi>S</mml:mi><mml:mi>T</mml:mi><mml:msub><mml:mrow><mml:mi>M</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>e</mml:mi><mml:mi>q</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>Where <italic>H</italic> represents the output dimension of the LSTM layer, denoted as <italic>LSTM</italic><sub><italic>H</italic></sub>. The static input <inline-formula><mml:math id="M14"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>X</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula> is then mapped to a D-dimensional vector <inline-formula><mml:math id="M15"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula> through a fully connected (Dense) layer</p>
<disp-formula id="E10"><label>(10)</label><mml:math id="M16"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:mi>L</mml:mi><mml:mi>U</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>W</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>X</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>b</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>Where <inline-formula><mml:math id="M17"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>W</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi><mml:mo>&#x000D7;</mml:mo><mml:mi>S</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula> and <inline-formula><mml:math id="M18"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>b</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula> are the weight matrix and bias vector of the fully connected layer. Then, the output of the LSTM layer <inline-formula><mml:math id="M19"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>L</mml:mi><mml:mi>S</mml:mi><mml:mi>T</mml:mi><mml:mi>M</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula> and the static feature representation <inline-formula><mml:math id="M20"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula> are concatenated together to form a joint vector <inline-formula><mml:math 
id="M21"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>D</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula></p>
<disp-formula id="E11"><label>(11)</label><mml:math id="M22"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>C</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>e</mml:mi><mml:mi>n</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>e</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>L</mml:mi><mml:mi>S</mml:mi><mml:mi>T</mml:mi><mml:mi>M</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>The joint feature vector passes through a fully connected layer with a sigmoid activation function to obtain the output value, which represents the risk probability</p>
<disp-formula id="E12"><label>(12)</label><mml:math id="M23"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x0005E;</mml:mo></mml:mover><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>W</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>h</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>b</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where &#x003C3; represents the sigmoid function, and <inline-formula><mml:math id="M24"><mml:msub><mml:mrow><mml:mstyle mathvariant="bold"><mml:mtext>W</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x000D7;</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>H</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>D</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:math></inline-formula> and <bold>b</bold><sub><italic>out</italic></sub> &#x02208; &#x0211D; are the weight matrix and bias vector of the output layer. The loss function uses binary cross-entropy to evaluate the deviation between the predicted risk probability and the true label (<xref ref-type="bibr" rid="B34">Shannon, 1948</xref>). Assuming the true label is <italic>y</italic> &#x02208; {0, 1} and the predicted risk probability is &#x00177; &#x02208; (0, 1), the binary cross-entropy loss is calculated as follows:</p>
<disp-formula id="E13"><label>(13)</label><mml:math id="M25"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>L</mml:mi><mml:mo>=</mml:mo><mml:mo>-</mml:mo><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>N</mml:mi></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>N</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo class="qopname">log</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo class="qopname">^</mml:mo></mml:mover></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo class="qopname">log</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo class="qopname">^</mml:mo></mml:mover></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>Where <italic>N</italic> represents the number of samples, <italic>y</italic><sub><italic>i</italic></sub> is the true label of the <italic>i</italic>-th sample, and &#x00177;<sub><italic>i</italic></sub> is the predicted probability for the <italic>i</italic>-th sample. The loss function penalizes incorrectly classified probabilities, guiding the model to update its weights and improve prediction accuracy.</p>
</sec>
<sec>
<title>3.3 Model prediction process</title>
<p>The overall prediction process of the proposed new energy vehicle accident risk prediction model based on dynamic-static feature fusion is shown in <xref ref-type="fig" rid="F6">Figure 6</xref>. The model mainly consists of three components: the data preprocessing module, the model training module, and the detection module.</p>
<list list-type="simple">
<list-item><p>(1) Data Preprocessing Module: The raw data tables are linked using VIN and license plate numbers, with invalid data being removed. To enhance model training effectiveness and data consistency, all input features are normalized. Weather, road type, alarm information, and historical accident types are encoded using one-hot encoding, while speed is normalized to the range [0,1]. To handle inconsistent data frequencies (1 Hz under fault conditions and every 30 s under normal conditions), a sliding window is used to ensure consistent time frame structures for time-series features across different data frequencies. In cases of low-frequency data, linear interpolation is applied within the window to ensure effective data input at each time step. A window from 20 to 10 s before the accident record time is selected as the input for predicting whether the accident will occur.</p></list-item>
<list-item><p>(2) Model Training Module: The preprocessed training data is fed into the network model for training, and the accident risk prediction model is generated by iteratively optimizing the model using the cross-entropy loss function. The structure of the prediction model is shown in <xref ref-type="fig" rid="F7">Figure 7</xref>. The traffic accidents predicted in this study include both minor and severe incidents. All accident records were sourced from user-reported data, either through self-registration via a mobile application or through formal emergency reporting.</p></list-item>
<list-item><p>(3) Risk Prediction Module: The risk prediction module inputs the preprocessed test data into the trained accident risk prediction model. The model performance is assessed by comparing the prediction results with the actual outcomes.</p></list-item>
</list>
<fig position="float" id="F6">
<label>Figure 6</label>
<caption><p>The prediction process of new energy vehicle accident risk prediction model.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0006.tif">
<alt-text>Flowchart depicting a system for accident prediction. It includes three modules: Data Preprocessing, Prediction and Evaluation, and Model Training. Data Preprocessing covers steps from raw data to a standard dataset. Prediction and Evaluation involve testing predictions against actual results to determine recall, accuracy, and precision. Model Training utilizes a training set with an LSTM layer, fully connected layer, ReLU activation, and loss backpropagation to produce predicted values.</alt-text>
</graphic>
</fig>
<fig position="float" id="F7">
<label>Figure 7</label>
<caption><p>The structure of the new energy vehicle accident risk prediction model.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0007.tif">
<alt-text>Diagram illustrating a machine learning model architecture with four sections. The top left shows input features divided into static and sequential inputs with ReLU and LSTM processing. The top right depicts vector concatenation and matrix operations, including multiplication and ReLU activation. The bottom left visualizes LSTM layers with inputs, forget gates, and outputs. The bottom right displays a fully connected network with input, hidden, and output layers, showing connections between neurons.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="s4">
<title>4 Results and discussion</title>
<sec>
<title>4.1 Evaluation metrics</title>
<p>After the model is constructed, its performance needs to be evaluated. Accident prediction is essentially a binary classification task. For binary classification problems, there are four possible outcomes:</p>
<list list-type="simple">
<list-item><p>True Positive (TP): The actual class is positive, and the prediction is also positive, meaning accident cases are accurately identified as accidents.</p></list-item>
<list-item><p>False Positive (FP): The actual class is negative, but the prediction is positive, referring to non-accident cases that are misclassified as accidents.</p></list-item>
<list-item><p>True Negative (TN): The actual class is negative, and the prediction is also negative, meaning non-accident instances are accurately predicted as non-accidents.</p></list-item>
<list-item><p>False Negative (FN): The actual class is positive, but the prediction is negative, referring to accident cases that are misidentified as non-accidents.</p></list-item>
</list>
<p>To evaluate the performance of the proposed model, Accuracy (Acc), Precision, Recall, and F1 Score are adopted as evaluation metrics.</p>
<list list-type="simple">
<list-item><p>(1) Accuracy represents the ratio of correctly classified samples to the total number of samples
<disp-formula id="E14"><label>(14)</label><mml:math id="M26"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>A</mml:mi><mml:mi>c</mml:mi><mml:mi>c</mml:mi><mml:mi>u</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>c</mml:mi><mml:mi>y</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p></list-item>
<list-item><p>(2) Recall means the proportion of actual positive samples that the classifier correctly predicts as positive
<disp-formula id="E15"><label>(15)</label><mml:math id="M27"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi><mml:mi>l</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p></list-item>
<list-item><p>(3) Precision denotes the proportion of true positive samples among the positive samples identified by the classifier
<disp-formula id="E16"><label>(16)</label><mml:math id="M28"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>P</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p></list-item>
<list-item><p>(4) F1 Score: To balance precision and recall, researchers proposed another evaluation metric&#x02014;the F-score (F1 Score). Its general form is <italic>F</italic><sub>&#x003B2;</sub>, as shown in <xref ref-type="disp-formula" rid="E17">Equation 17</xref>.
<disp-formula id="E17"><label>(17)</label><mml:math id="M29"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x003B2;</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x0002B;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x003B2;</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mi>P</mml:mi><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:msup><mml:mrow><mml:mi>&#x003B2;</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>R</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p>
<p>Where <italic>P</italic> represents precision, and <italic>R</italic> denotes recall. The setting of &#x003B2; allows for different weights to be assigned to recall and precision. When &#x003B2; &#x0003E; 1, recall has a greater impact; when 0 &#x0003C; &#x003B2; &#x0003C; 1, precision has a greater impact. In practical tests, both precision and recall are equally important, so &#x003B2; is typically set to 1. Consequently, <xref ref-type="disp-formula" rid="E17">Equation 17</xref> simplifies to <xref ref-type="disp-formula" rid="E18">Equation 18</xref>, representing the widely used F1 score. The F1 score generally ranges from 0 to 1, with higher values indicating better algorithm performance.
<disp-formula id="E18"><label>(18)</label><mml:math id="M30"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>2</mml:mn><mml:mi>P</mml:mi><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>R</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p></list-item>
<list-item><p>(5) False Negative Rate (FNR): The false negative rate indicates the proportion of actual incidents that the system fails to detect. A low FNR is critical for ensuring user trust and system safety. It can be calculated as:
<disp-formula id="E19"><label>(19)</label><mml:math id="M31"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>F</mml:mi><mml:mi>N</mml:mi><mml:mi>R</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p></list-item>
<list-item><p>(6) Area Under the Receiver Operating Characteristic Curve (AUC): The AUC represents the model&#x00027;s ability to distinguish between positive and negative classes across all possible thresholds. An AUC of 1.0 indicates a perfect classifier, while 0.5 suggests no discriminative ability. The ROC curve plots the True Positive Rate (TPR) against the False Positive Rate (FPR) at various threshold settings. Specifically:
<disp-formula id="E20"><label>(20)</label><mml:math id="M32"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mi>R</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<disp-formula id="E21"><label>(21)</label><mml:math id="M33"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mi>R</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p>
<p>The AUC is the area under the ROC curve, which can be computed as the integral of the ROC curve:
<disp-formula id="E22"><label>(22)</label><mml:math id="M34"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>A</mml:mi><mml:mi>U</mml:mi><mml:mi>C</mml:mi><mml:mo>=</mml:mo><mml:msubsup><mml:mrow><mml:mo>&#x0222B;</mml:mo></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mi>R</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mi>R</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mi>d</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mi>R</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p>
<p>Moreover, the AUC can also be approximated by numerical integration methods using discrete points on the ROC curve:
<disp-formula id="E23"><label>(23)</label><mml:math id="M35"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>A</mml:mi><mml:mi>U</mml:mi><mml:mi>C</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:munderover></mml:mstyle><mml:mfrac><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:msub><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:msub><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:mfrac><mml:mo>&#x000D7;</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:msub><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:msub><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p>
<p>where <italic>n</italic> is the number of points on the ROC curve. The AUC ranges from 0 to 1, with values closer to 1 indicating better classification performance.</p>
</list-item>
</list>
</sec>
<sec>
<title>4.2 Dataset and experimental setup</title>
<p>This experiment selects a portion of the 2021 accident data and non-accident data at a 1:5 ratio, constructing a dataset containing 7,386 records. The dataset is divided into a training set and a test set at a ratio of 8:2. The experiment is conducted using the Python 3.8 programming platform and the PyTorch 2.0.1 framework. The model was trained using the Adam optimizer with an initial learning rate of 0.001. A batch size of 32 was employed, and the training was conducted for a total of 100 epochs.</p>
<p>To obtain the optimal LSTM network parameters, grid search is used to evaluate prediction accuracy under different combinations of LSTM layer depth and hidden size. As shown in <xref ref-type="fig" rid="F8">Figure 8</xref>, the highest validation accuracy of 85.4% is achieved with two LSTM layers, each containing 64 hidden units. However, continuously increasing the number of layers (beyond two) or hidden units (e.g., 256) does not lead to further improvement and may slightly reduce performance, likely due to overfitting. These results suggest that a moderately deep and well-balanced architecture is most suitable for modeling dynamic accident risk in new energy vehicles.</p>
<fig position="float" id="F8">
<label>Figure 8</label>
<caption><p>Validation accuracy of LSTM architectures with varying depth and hidden units.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0008.tif">
<alt-text>Line graph titled &#x0201C;Grid Search of LSTM Layers and Hidden Sizes&#x0201D; showing accuracy versus hidden size. Three lines represent different LSTM layers: one layer (blue), two layers (orange), and three layers (green). Accuracy peaks at hidden size sixty-four for each configuration before declining.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<title>4.3 Experimental results and analysis</title>
<p>As shown in <xref ref-type="fig" rid="F9">Figure 9</xref>, the training loss decreases rapidly during the initial epochs, dropping from approximately 1.02 to below 0.3, indicating that the model quickly learns meaningful feature representations at an early stage. As training continues, the loss gradually declines and stabilizes around 0.13 after about 60 epochs, suggesting a stable training process without significant oscillations or signs of overfitting. It is worth noting that the loss curve exhibits some fluctuations between epochs 10 and 40, which may be caused by factors such as optimizer hyperparameters (e.g., learning rate) or gradient noise from mini-batch training. However, these variations are minor and diminish in later stages, demonstrating good overall convergence.</p>
<fig position="float" id="F9">
<label>Figure 9</label>
<caption><p>The training loss of the proposed model over epochs.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0009.tif">
<alt-text>Line graph showing the decrease in loss over 100 epochs. The vertical axis represents loss, decreasing from 1.0 to approximately 0.1. The horizontal axis represents epochs. The line shows a rapid decline initially, then gradually stabilizes.</alt-text>
</graphic>
</fig>
<p><xref ref-type="fig" rid="F10">Figure 10</xref> illustrates the trend of training accuracy over epochs. In the early stages, accuracy increases significantly from approximately 0.42 to around 0.70, indicating that the model quickly learns key discriminative patterns. As training progresses, accuracy continues to improve gradually and begins to plateau after about 60 epochs, eventually stabilizing at around 0.82.</p>
<fig position="float" id="F10">
<label>Figure 10</label>
<caption><p>The training accuracy of the proposed model over epochs.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frsc-07-1649853-g0010.tif">
<alt-text>Line graph showing model accuracy over 100 epochs. Accuracy starts at 0.40 and increases steeply, leveling around 0.75, and fluctuates slightly before reaching close to 0.80.</alt-text>
</graphic>
</fig>
<p>The consistent improvement and eventual convergence in accuracy closely align with the trend observed in the loss curve, further confirming the effectiveness and stability of the training process. Additionally, the absence of accuracy degradation indicates that the model does not exhibit signs of overfitting during training.</p>
<p>To evaluate the effectiveness of temporal modeling and feature integration, we compared our proposed LSTM-based approach with several classical machine learning models, including Random Forest, Support Vector Machine (SVM), and XGBoost. As summarized in <xref ref-type="table" rid="T4">Table 4</xref>, XGBoost achieves relatively high performance with an accuracy of 84.1%, F1-score of 82.9%, and an AUC of 0.875. This indicates that tree-based ensemble methods can efficiently exploit static and momentary dynamic features to make accurate predictions.</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Performance comparison of different models for NEV accident risk prediction.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Model</bold></th>
<th valign="top" align="left"><bold>Feature input</bold></th>
<th valign="top" align="center"><bold>Accuracy</bold></th>
<th valign="top" align="center"><bold>Recall</bold></th>
<th valign="top" align="center"><bold>Precision</bold></th>
<th valign="top" align="center"><bold>F1 score</bold></th>
<th valign="top" align="center"><bold>FNR</bold></th>
<th valign="top" align="center"><bold>AUC</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">RF</td>
<td valign="top" align="left">Dynamic-static</td>
<td valign="top" align="center">81.3%</td>
<td valign="top" align="center">82.2%</td>
<td valign="top" align="center">80.4%</td>
<td valign="top" align="center">81.3%</td>
<td valign="top" align="center">17.8%</td>
<td valign="top" align="center">0.849</td>
</tr>
<tr>
<td valign="top" align="left">SVM</td>
<td valign="top" align="left">Dynamic-static</td>
<td valign="top" align="center">56.3%</td>
<td valign="top" align="center">53.5%</td>
<td valign="top" align="center">60.2%</td>
<td valign="top" align="center">56.7%</td>
<td valign="top" align="center">46.5%</td>
<td valign="top" align="center">0.607</td>
</tr>
<tr>
<td valign="top" align="left">XGBoost</td>
<td valign="top" align="left">Dynamic-static</td>
<td valign="top" align="center">84.1%</td>
<td valign="top" align="center">82.2%</td>
<td valign="top" align="center">83.7%</td>
<td valign="top" align="center">82.9%</td>
<td valign="top" align="center">17.8%</td>
<td valign="top" align="center">0.875</td>
</tr>
<tr>
<td valign="top" align="left">Proposed</td>
<td valign="top" align="left">Dynamic-static</td>
<td valign="top" align="center">85.4%</td>
<td valign="top" align="center">82.9%</td>
<td valign="top" align="center">84.5%</td>
<td valign="top" align="center">83.7%</td>
<td valign="top" align="center">17.1%</td>
<td valign="top" align="center">0.891</td>
</tr></tbody>
</table>
</table-wrap>
<p>However, XGBoost lacks the ability to capture temporal dependencies, which limits its performance in scenarios involving evolving risk over time. In contrast, the LSTM-based model demonstrates superior capability in modeling sequential patterns. By learning from historical behavior trajectories, LSTM enhances the model&#x00027;s sensitivity to risk fluctuations and improves real-time accident prediction.</p>
<p>As shown in <xref ref-type="table" rid="T4">Table 4</xref>, the proposed dynamic-static feature fusion LSTM model demonstrates outstanding performance across all key metrics. First, the model achieves an accuracy of 85.4%, significantly outperforming both RF (81.3%) and SVM (56.3%), and slightly exceeding the high-performing XGBoost (84.1%), indicating its superior overall prediction accuracy. Additionally, the model attains a recall of 82.9%, comparable to RF (82.2%) and XGBoost (82.2%), and significantly higher than SVM (53.5%), highlighting its reliable ability to identify potential accident risks. At the same time, the precision of the model is 84.5%, surpassing all comparison models (RF: 80.4%, SVM: 60.2%, XGBoost: 83.7%), demonstrating the high reliability of its triggered risk alerts and minimizing the risk of false positives.</p>
<p>The model also achieves an F1 score of 83.7%, outperforming RF (81.3%), SVM (56.7%), and XGBoost (82.9%), effectively balancing the trade-off between precision and recall. The low False Negative Rate (FNR) of 17.1% is another notable advantage, slightly better than both RF (17.8%) and XGBoost (17.8%), and significantly improving upon SVM (46.5%), thus reducing the risk of missed accidents and enhancing the safety of the prediction system. Finally, the AUC value of the model is 0.891, surpassing all comparison models (RF: 0.849, SVM: 0.607, XGBoost: 0.875), indicating its superior ability to distinguish between accident and non-accident states across various classification thresholds.</p>
<p>In conclusion, the proposed LSTM model, integrating both dynamic and static features, not only excels in accuracy, precision, F1 score, and AUC, but also ensures efficient accident prediction through a lower FNR. The model&#x00027;s exceptional performance confirms the effectiveness of the LSTM architecture in capturing temporal features of vehicle dynamics and emphasizes the importance of the feature fusion mechanism in integrating static and dynamic information. These advantages make the model highly applicable to the safety prediction tasks for new energy vehicles.</p>
</sec>
<sec>
<title>4.4 Ablation study on feature and architecture contributions</title>
<p>To validate the contribution of different feature types and network components, we conducted an ablation study across five model configurations. The settings for each model are shown in <xref ref-type="table" rid="T5">Table 5</xref>. As shown in <xref ref-type="table" rid="T6">Table 6</xref>, using only static features (Model A) yields the weakest performance (F1 score = 64.6%, AUC = 0.652), suggesting their limited predictive value. Incorporating dynamic features with temporal modeling (Model B) significantly improves both AUC (0.791) and recall, reducing the false negative rate (FNR) from 27.5% to 25.7%. When all sequential features are used (Model C), performance further improves (F1 = 76.9%, AUC = 0.823), highlighting the benefit of comprehensive temporal input. A purely feedforward model (Model D) that fuses static and dynamic features, but without LSTM, performs better than the sequential-only model, achieving an F1 score of 80.9% and reducing FNR to 19.5%. Our proposed model (Model E) achieves the best overall performance across all metrics: F1 = 83.7%, FNR = 17.1%, and AUC = 0.891, confirming that both LSTM-based temporal modeling and feature fusion are critical to accurate accident risk prediction.</p>
<table-wrap position="float" id="T5">
<label>Table 5</label>
<caption><p>Model configurations for ablation study.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Model ID</bold></th>
<th valign="top" align="left"><bold>Model name</bold></th>
<th valign="top" align="left"><bold>Feature input</bold></th>
<th valign="top" align="left"><bold>Feature type</bold></th>
<th valign="top" align="left"><bold>Uses LSTM</bold></th>
<th valign="top" align="left"><bold>Static feature fusion</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">A</td>
<td valign="top" align="left">Static-only baseline</td>
<td valign="top" align="left">Weather &#x0002B; road type</td>
<td valign="top" align="left">Static</td>
<td valign="top" align="left">No</td>
<td valign="top" align="left">No</td>
</tr>
<tr>
<td valign="top" align="left">B</td>
<td valign="top" align="left">Dynamic-only baseline</td>
<td valign="top" align="left">Speed &#x0002B; alarm</td>
<td valign="top" align="left">Dynamic</td>
<td valign="top" align="left">Yes</td>
<td valign="top" align="left">No</td>
</tr>
<tr>
<td valign="top" align="left">C</td>
<td valign="top" align="left">All sequential features only</td>
<td valign="top" align="left">Weather &#x0002B; road &#x0002B; speed &#x0002B; alarm</td>
<td valign="top" align="left">Dynamic</td>
<td valign="top" align="left">Yes</td>
<td valign="top" align="left">No</td>
</tr>
<tr>
<td valign="top" align="left">D</td>
<td valign="top" align="left">Static &#x0002B; sequential (no LSTM)</td>
<td valign="top" align="left">All features</td>
<td valign="top" align="left">Static &#x0002B; dynamic</td>
<td valign="top" align="left">No</td>
<td valign="top" align="left">Yes</td>
</tr>
<tr>
<td valign="top" align="left">E</td>
<td valign="top" align="left">Proposed (LSTM &#x0002B; fusion)</td>
<td valign="top" align="left">All features</td>
<td valign="top" align="left">Static &#x0002B; dynamic</td>
<td valign="top" align="left">Yes</td>
<td valign="top" align="left">Yes (fusion of static and dynamic)</td>
</tr></tbody>
</table>
</table-wrap>
<table-wrap position="float" id="T6">
<label>Table 6</label>
<caption><p>Ablation study results of different feature and architecture configurations.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Model</bold></th>
<th valign="top" align="center"><bold>Accuracy</bold></th>
<th valign="top" align="center"><bold>Recall</bold></th>
<th valign="top" align="center"><bold>Precision</bold></th>
<th valign="top" align="center"><bold>F1 score</bold></th>
<th valign="top" align="center"><bold>FNR</bold></th>
<th valign="top" align="center"><bold>AUC</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">A</td>
<td valign="top" align="center">61.5%</td>
<td valign="top" align="center">72.5%</td>
<td valign="top" align="center">58.2%</td>
<td valign="top" align="center">64.6%</td>
<td valign="top" align="center">27.5%</td>
<td valign="top" align="center">0.652</td>
</tr>
<tr>
<td valign="top" align="left">B</td>
<td valign="top" align="center">75.0%</td>
<td valign="top" align="center">74.3%</td>
<td valign="top" align="center">73.7%</td>
<td valign="top" align="center">73.4%</td>
<td valign="top" align="center">25.7%</td>
<td valign="top" align="center">0.791</td>
</tr>
<tr>
<td valign="top" align="left">C</td>
<td valign="top" align="center">78.2%</td>
<td valign="top" align="center">76.6%</td>
<td valign="top" align="center">77.2%</td>
<td valign="top" align="center">76.9%</td>
<td valign="top" align="center">23.4%</td>
<td valign="top" align="center">0.823</td>
</tr>
<tr>
<td valign="top" align="left">D</td>
<td valign="top" align="center">82.3%</td>
<td valign="top" align="center">80.5%</td>
<td valign="top" align="center">81.4%</td>
<td valign="top" align="center">80.9%</td>
<td valign="top" align="center">19.5%</td>
<td valign="top" align="center">0.861</td>
</tr>
<tr>
<td valign="top" align="left">E</td>
<td valign="top" align="center">85.4%</td>
<td valign="top" align="center">82.9%</td>
<td valign="top" align="center">84.5%</td>
<td valign="top" align="center">83.7%</td>
<td valign="top" align="center">17.1%</td>
<td valign="top" align="center">0.891</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec sec-type="conclusions" id="s5">
<title>5 Conclusion</title>
<p>This paper presents an accident risk prediction model for new energy vehicles based on dynamic-static feature fusion. First, both direct and indirect features strongly associated with accident risk are extracted from a full year of provincial accident data from 2021. Then, LSTM layers are employed to construct dynamic and static feature vectors that capture potential risk characteristics. Moreover, the accident risk probability is estimated using fully connected layers with a sigmoid activation function. Finally, the model is validated using real-world accident data. The results demonstrate that the model achieves an F1-score of 83.7% for accident prediction, enabling real-time identification of potential risks and timely driver warnings. This approach provides valuable data support for safety management and accident prevention in new energy vehicles, promoting the low-carbon and sustainable development of the automotive industry.</p>
<p>In the future, this study will collect accident data from multiple regions to verify and enhance the robustness of the proposed algorithm across different areas. Additionally, embedded encoding will replace one-hot encoding to better handle large-scale data processing, aiming to provide traffic management authorities with more accurate and comprehensive accident warning information for new energy vehicles.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The datasets presented in this article are not readily available because this research utilizes proprietary operational data obtained under strict confidentiality agreements with industry partners. Due to legal and privacy protections governing vehicular data in China (e.g., Personal Information Protection Law, PIPL), raw datasets containing personally identifiable information (PII) cannot be publicly shared. All analyzed features were anonymized and aggregated to comply with regulatory requirements. Requests to access the datasets should be directed to Xiang Zhang, <email>zhangxiang&#x00040;tmri.cn</email>.</p>
</sec>
<sec sec-type="author-contributions" id="s7">
<title>Author contributions</title>
<p>XZ: Writing &#x02013; original draft, Funding acquisition, Data curation, Resources. XY: Writing &#x02013; review &#x00026; editing. SH: Resources, Conceptualization, Validation, Writing &#x02013; review &#x00026; editing. GZ: Methodology, Writing &#x02013; original draft, Visualization. CW: Writing &#x02013; review &#x00026; editing.</p>
</sec>
<sec sec-type="funding-information" id="s8">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This research was funded by National Key R&#x00026;D Program of China, grant number 2022YFE0207800.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s9">
<title>Generative AI statement</title>
<p>The author(s) declare that no Gen AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ahmed</surname> <given-names>S.</given-names></name> <name><surname>Hossain</surname> <given-names>M. A.</given-names></name> <name><surname>Ray</surname> <given-names>S. K.</given-names></name> <name><surname>Bhuiyan</surname> <given-names>M. M. I.</given-names></name> <name><surname>Sabuj</surname> <given-names>S. R.</given-names></name></person-group> (<year>2023</year>). <article-title>A study on road accident prediction and contributing factors using explainable machine learning models: analysis and performance</article-title>. <source>Transp. Res. Interdiscip. Perspect.</source> <volume>19</volume>:<fpage>100814</fpage>. <pub-id pub-id-type="doi">10.1016/j.trip.2023.100814</pub-id></citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ardakani</surname> <given-names>S.</given-names></name> <name><surname>Liang</surname> <given-names>X.</given-names></name> <name><surname>Mengistu</surname> <given-names>K. T.</given-names></name> <name><surname>So</surname> <given-names>R. S.</given-names></name> <name><surname>Wei</surname> <given-names>X.</given-names></name> <name><surname>He</surname> <given-names>B.</given-names></name> <name><surname>Cheshmehzangi</surname> <given-names>A.</given-names></name></person-group> (<year>2023</year>). <article-title>Road car accident prediction using a machine-learning-enabled data analysis</article-title>. <source>Sustainability</source> <volume>15</volume>:<fpage>5939</fpage>. <pub-id pub-id-type="doi">10.3390/su15075939</pub-id></citation>
</ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aung</surname> <given-names>N.</given-names></name> <name><surname>Zhang</surname> <given-names>W.</given-names></name> <name><surname>Dhelim</surname> <given-names>S.</given-names></name> <name><surname>Ai</surname> <given-names>Y.</given-names></name></person-group> (<year>2018</year>). <article-title>Accident prediction system based on hidden Markov model for vehicular ad-hoc network in urban environments</article-title>. <source>Information</source> <volume>9</volume>:<fpage>311</fpage>. <pub-id pub-id-type="doi">10.3390/info9120311</pub-id></citation>
</ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Basso</surname> <given-names>F.</given-names></name> <name><surname>Pezoa</surname> <given-names>R.</given-names></name> <name><surname>Varas</surname> <given-names>M.</given-names></name> <name><surname>Villalobos</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>A deep learning approach for real-time crash prediction using vehicle-by-vehicle data</article-title>. <source>Accid. Anal. Prev.</source> <volume>162</volume>:<fpage>106409</fpage>. <pub-id pub-id-type="doi">10.1016/j.aap.2021.106409</pub-id><pub-id pub-id-type="pmid">34600313</pub-id></citation></ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Berhanu</surname> <given-names>Y.</given-names></name> <name><surname>Alemayehu</surname> <given-names>E.</given-names></name> <name><surname>Schr&#x000F6;der</surname> <given-names>D.</given-names></name></person-group> (<year>2023</year>). <article-title>Examining car accident prediction techniques and road traffic congestion: a comparative analysis of road safety and prevention of world challenges in low-income and high-income countries</article-title>. <source>J. Adv. Transp.</source> <volume>2023</volume>:<fpage>6643412</fpage>. <pub-id pub-id-type="doi">10.1155/2023/6643412</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Br&#x000FC;hwiler</surname> <given-names>L.</given-names></name> <name><surname>Fu</surname> <given-names>C.</given-names></name> <name><surname>Huang</surname> <given-names>H.</given-names></name> <name><surname>Longhi</surname> <given-names>L.</given-names></name> <name><surname>Weibel</surname> <given-names>R.</given-names></name></person-group> (<year>2022</year>). <article-title>Predicting individuals&#x00027; car accident risk by trajectory, driving events, and geographical context</article-title>. <source>Comp. Environ. Urban Syst.</source> <volume>93</volume>:<fpage>101760</fpage>. <pub-id pub-id-type="doi">10.1016/j.compenvurbsys.2022.101760</pub-id></citation>
</ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Casner</surname> <given-names>S. M.</given-names></name> <name><surname>Hutchins</surname> <given-names>E. L.</given-names></name> <name><surname>Norman</surname> <given-names>D.</given-names></name></person-group> (<year>2016</year>). <article-title>The challenges of partially automated driving</article-title>. <source>Commun. ACM</source> <volume>59</volume>, <fpage>70</fpage>&#x02013;<lpage>77</lpage>. <pub-id pub-id-type="doi">10.1145/2830565</pub-id><pub-id pub-id-type="pmid">32690975</pub-id></citation></ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chakraborty</surname> <given-names>A.</given-names></name> <name><surname>Mukherjee</surname> <given-names>D.</given-names></name> <name><surname>Mitra</surname> <given-names>S.</given-names></name></person-group> (<year>2019</year>). <article-title>Development of pedestrian crash prediction model for a developing country using artificial neural network</article-title>. <source>Int. J. Inj. Control Saf. Promot.</source> <volume>26</volume>, <fpage>283</fpage>&#x02013;<lpage>293</lpage>. <pub-id pub-id-type="doi">10.1080/17457300.2019.1627463</pub-id><pub-id pub-id-type="pmid">31271110</pub-id></citation></ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>B.</given-names></name> <name><surname>Yuan</surname> <given-names>W.</given-names></name> <name><surname>Fu</surname> <given-names>R.</given-names></name> <name><surname>Guo</surname> <given-names>Y.-S.</given-names></name></person-group> (<year>2009</year>). <article-title>Analysis of traffic accident characteristic on continuous long downgrade section</article-title>. <source>J. Traffic Transp. Eng.</source> <volume>9</volume>, <fpage>75</fpage>&#x02013;<lpage>78</lpage>. <pub-id pub-id-type="doi">10.19818/j.cnki.1671-1637.2009.04.015</pub-id></citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Enache</surname> <given-names>N. M.</given-names></name> <name><surname>Netto</surname> <given-names>M.</given-names></name> <name><surname>Mammar</surname> <given-names>S.</given-names></name> <name><surname>Lusetti</surname> <given-names>B.</given-names></name></person-group> (<year>2009</year>). <article-title>Driver steering assistance for lane departure avoidance</article-title>. <source>Control Eng. Pract.</source> <volume>17</volume>, <fpage>642</fpage>&#x02013;<lpage>651</lpage>. <pub-id pub-id-type="doi">10.1016/j.conengprac.2008.10.012</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Feng</surname> <given-names>Z. G.</given-names></name> <name><surname>Huang</surname> <given-names>B. Y.</given-names></name> <name><surname>Liang</surname> <given-names>W. G.</given-names></name></person-group> (<year>2010</year>). <article-title>Mechanism analysis of the impact of natural environmental factors on road traffic safety</article-title>. <source>Shanxi Archit.</source> <volume>36</volume>, <fpage>301</fpage>&#x02013;<lpage>302</lpage>. <pub-id pub-id-type="doi">10.13719/j.cnki.cn14-1279/tu.2010.03.034</pub-id><pub-id pub-id-type="pmid">29653308</pub-id></citation></ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ghasedi</surname> <given-names>M.</given-names></name> <name><surname>Sarfjoo</surname> <given-names>M.</given-names></name> <name><surname>Bargegol</surname> <given-names>I.</given-names></name></person-group> (<year>2021</year>). <article-title>Prediction and analysis of the severity and number of suburban accidents using logit model, factor analysis and machine learning: a case study in a developing country</article-title>. <source>SN Appl. Sci.</source> <volume>3</volume>:<fpage>13</fpage>. <pub-id pub-id-type="doi">10.1007/s42452-020-04081-3</pub-id></citation>
</ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ghosh</surname> <given-names>B.</given-names></name> <name><surname>Karmakar</surname> <given-names>S.</given-names></name></person-group> (<year>2025</year>). <article-title>A safety assessment and accident prediction over national level highway using artificial neural network</article-title>. <source>J. Inst. Eng. India. Ser. A.</source> <fpage>1</fpage>&#x02013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1007/s40030-025-00889-7</pub-id></citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hao</surname> <given-names>D.</given-names></name> <name><surname>Zhao</surname> <given-names>D. Q.</given-names></name> <name><surname>Kuang</surname> <given-names>L.</given-names></name></person-group> (<year>2015</year>). <article-title>Research and application of non-contact remote sensing pavement condition detection and early warning system</article-title>. <source>J. Transp. Sci. Eng.</source> <volume>31</volume>, <fpage>85</fpage>&#x02013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.16544/j.cnki.cn43-1494/u.2015.01.015</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hassan</surname> <given-names>H. M.</given-names></name> <name><surname>Abdel-Aty</surname> <given-names>M. A.</given-names></name></person-group> (<year>2011</year>). <article-title>Analysis of drivers&#x00027; behavior under reduced visibility conditions using a structural equation modeling approach</article-title>. <source>Transp. Res. Part F. Traffic Psychol. Behav.</source> <volume>14</volume>, <fpage>614</fpage>&#x02013;<lpage>625</lpage>. <pub-id pub-id-type="doi">10.1016/j.trf.2011.07.002</pub-id></citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hochreiter</surname> <given-names>S.</given-names></name> <name><surname>Schmidhuber</surname> <given-names>J.</given-names></name></person-group> (<year>1997</year>). <article-title>Long short-term memory</article-title>. <source>Neural Comput.</source> <volume>9</volume>, <fpage>1735</fpage>&#x02013;<lpage>1780</lpage>. <pub-id pub-id-type="doi">10.1162/neco.1997.9.8.1735</pub-id><pub-id pub-id-type="pmid">9377276</pub-id></citation></ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kaffash Charandabi</surname> <given-names>N.</given-names></name> <name><surname>Gholami</surname> <given-names>A.</given-names></name> <name><surname>Abdollahzadeh Bina</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>Road accident risk prediction using generalized regression neural network optimized with self-organizing map</article-title>. <source>Neural Comp. Appl.</source> <volume>34</volume>, <fpage>8511</fpage>&#x02013;<lpage>8524</lpage>. <pub-id pub-id-type="doi">10.1007/s00521-021-06549-8</pub-id></citation>
</ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koramati</surname> <given-names>S.</given-names></name> <name><surname>Majumdar</surname> <given-names>B. B.</given-names></name> <name><surname>Pani</surname> <given-names>A.</given-names></name> <name><surname>Sahu</surname> <given-names>P. K.</given-names></name></person-group> (<year>2022</year>). <article-title>A registry-based investigation of road traffic fatality risk factors using police data: a case study of Hyderabad, India</article-title>. <source>Saf. Sci.</source> <volume>153</volume>:<fpage>105805</fpage>. <pub-id pub-id-type="doi">10.1016/j.ssci.2022.105805</pub-id></citation>
</ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name></person-group> (<year>2025</year>). <article-title>Traffic accident risk prediction based on deep learning and spatiotemporal features of vehicle trajectories</article-title>. <source>PLoS One</source> <volume>20</volume>:<fpage>e0320656</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0320656</pub-id><pub-id pub-id-type="pmid">40315419</pub-id></citation></ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Yu</surname> <given-names>L.</given-names></name></person-group> (<year>2025</year>). <article-title>Prediction of traffic accident risk based on vehicle trajectory data</article-title>. <source>Traffic Injury Prev.</source> <volume>26</volume>, <fpage>164</fpage>&#x02013;<lpage>171</lpage>. <pub-id pub-id-type="doi">10.1080/15389588.2024.2402936</pub-id><pub-id pub-id-type="pmid">39570198</pub-id></citation></ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>D. J.</given-names></name> <name><surname>Chen</surname> <given-names>M. Y.</given-names></name> <name><surname>Chiang</surname> <given-names>H. S.</given-names></name> <name><surname>Sharma</surname> <given-names>P. K.</given-names></name></person-group> (<year>2021</year>). <article-title>Intelligent traffic accident prediction model for Internet of Vehicles with deep learning approach</article-title>. <source>IEEE Trans. Intell. Transp. Syst.</source> <volume>23</volume>, <fpage>2340</fpage>&#x02013;<lpage>2349</lpage>. <pub-id pub-id-type="doi">10.1109/TITS.2021.3074987</pub-id></citation>
</ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>Q.</given-names></name> <name><surname>Sadek</surname> <given-names>A. W.</given-names></name></person-group> (<year>2015</year>). <article-title>A novel variable selection method based on frequent pattern tree for real-time traffic accident risk prediction</article-title>. <source>Transp. Res. Part C. Emerging Technol.</source> <volume>55</volume>, <fpage>444</fpage>&#x02013;<lpage>459</lpage>. <pub-id pub-id-type="doi">10.1016/j.trc.2015.03.015</pub-id></citation>
</ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mandal</surname> <given-names>B.</given-names></name> <name><surname>Li</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>G. S.</given-names></name> <name><surname>Lin</surname> <given-names>J.</given-names></name></person-group> (<year>2016</year>). <article-title>Towards detection of bus driver fatigue based on robust visual analysis of eye state</article-title>. <source>IEEE Trans. Intell. Transp. Syst.</source> <volume>18</volume>, <fpage>545</fpage>&#x02013;<lpage>557</lpage>. <pub-id pub-id-type="doi">10.1109/TITS.2016.2582900</pub-id></citation>
</ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mantouka</surname> <given-names>E. G.</given-names></name> <name><surname>Barmpounakis</surname> <given-names>E. N.</given-names></name> <name><surname>Vlahogianni</surname> <given-names>E. I.</given-names></name></person-group> (<year>2019</year>). <article-title>Identification of driving safety profiles from smartphone data using machine learning techniques</article-title>. <source>Saf. Sci.</source> <volume>119</volume>, <fpage>84</fpage>&#x02013;<lpage>90</lpage>. <pub-id pub-id-type="doi">10.1016/j.ssci.2019.01.025</pub-id></citation>
</ref>
<ref id="B25">
<citation citation-type="book"><person-group person-group-type="author"><collab>Ministry of Public Security</collab></person-group> (<year>2024</year>). <source>The Number of Motor Vehicles in China Reaches 435 Million, with 523 Million Drivers, and the Number of New Energy Vehicles Exceeds 20 Million</source>. <publisher-loc>China</publisher-loc>: <publisher-name>The Central People&#x00027;s Government of the People&#x00027;s Republic of China</publisher-name>.</citation>
</ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Najafi Moghaddam Gilani</surname> <given-names>V.</given-names></name> <name><surname>Hosseinian</surname> <given-names>S. M.</given-names></name> <name><surname>Ghasedi</surname> <given-names>M.</given-names></name> <name><surname>Nikookar</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>Data-driven urban traffic accident analysis and prediction using logit and machine learning-based pattern recognition models</article-title>. <source>Math. Probl. Eng.</source> <volume>2021</volume>:<fpage>9974219</fpage>. <pub-id pub-id-type="doi">10.1155/2021/9974219</pub-id></citation>
</ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ning</surname> <given-names>H.</given-names></name> <name><surname>Xu</surname> <given-names>W.</given-names></name> <name><surname>Zhou</surname> <given-names>Y.</given-names></name> <name><surname>Gong</surname> <given-names>Y.</given-names></name> <name><surname>Huang</surname> <given-names>T. S.</given-names></name></person-group> (<year>2009</year>). <article-title>A general framework to detect unsafe system states from multisensor data stream</article-title>. <source>IEEE Trans. Intell. Transp. Syst.</source> <volume>11</volume>, <fpage>4</fpage>&#x02013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1109/TITS.2009.2026446</pub-id></citation>
</ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Park</surname> <given-names>R. C.</given-names></name> <name><surname>Hong</surname> <given-names>E. J.</given-names></name></person-group> (<year>2022</year>). <article-title>Urban traffic accident risk prediction for knowledge-based mobile multimedia service</article-title>. <source>Pers. Ubiquitous Comp.</source> <volume>26</volume>, <fpage>417</fpage>&#x02013;<lpage>427</lpage>. <pub-id pub-id-type="doi">10.1007/s00779-020-01442-y</pub-id></citation>
</ref>
<ref id="B29">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Prajapati</surname> <given-names>G.</given-names></name> <name><surname>Kumar</surname> <given-names>L.</given-names></name> <name><surname>Patil</surname> <given-names>S. R. S.</given-names></name></person-group> (<year>2023</year>). <article-title>Road accident prediction using machine learning</article-title>. <source>J. Sci. Res. Technol.</source> <volume>1</volume>, <fpage>48</fpage>&#x02013;<lpage>59</lpage>. <pub-id pub-id-type="doi">10.5281/zenodo.7961680</pub-id></citation>
</ref>
<ref id="B30">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Ren</surname> <given-names>H.</given-names></name> <name><surname>Song</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Hu</surname> <given-names>Y.</given-names></name> <name><surname>Lei</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;A deep learning approach to the citywide traffic accident risk prediction,&#x0201D;</article-title> in <source>2018 21st International Conference on Intelligent Transportation Systems (ITSC)</source> (<publisher-loc>Maui, HI</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>3346</fpage>&#x02013;<lpage>3351</lpage>. <pub-id pub-id-type="doi">10.1109/ITSC.2018.8569437</pub-id></citation>
</ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roland</surname> <given-names>J.</given-names></name> <name><surname>Way</surname> <given-names>P. D.</given-names></name> <name><surname>Firat</surname> <given-names>C.</given-names></name> <name><surname>Doan</surname> <given-names>T. N.</given-names></name> <name><surname>Sartipi</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>Modeling and predicting vehicle accident occurrence in Chattanooga, Tennessee</article-title>. <source>Accid. Anal. Prev.</source> <volume>149</volume>:<fpage>105860</fpage>. <pub-id pub-id-type="doi">10.1016/j.aap.2020.105860</pub-id><pub-id pub-id-type="pmid">33171397</pub-id></citation></ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Santos</surname> <given-names>D.</given-names></name> <name><surname>Saias</surname> <given-names>J.</given-names></name> <name><surname>Quaresma</surname> <given-names>P.</given-names></name> <name><surname>Nogueira</surname> <given-names>V. B.</given-names></name></person-group> (<year>2021</year>). <article-title>Machine learning approaches to traffic accident analysis and hotspot prediction</article-title>. <source>Computers</source> <volume>10</volume>:<fpage>157</fpage>. <pub-id pub-id-type="doi">10.3390/computers10120157</pub-id><pub-id pub-id-type="pmid">40627630</pub-id></citation></ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shaik</surname> <given-names>M. E.</given-names></name> <name><surname>Islam</surname> <given-names>M. M.</given-names></name> <name><surname>Hossain</surname> <given-names>Q. S.</given-names></name></person-group> (<year>2021</year>). <article-title>A review on neural network techniques for the prediction of road traffic accident severity</article-title>. <source>Asian Transp. Stud.</source> <volume>7</volume>:<fpage>100040</fpage>. <pub-id pub-id-type="doi">10.1016/j.eastsj.2021.100040</pub-id></citation>
</ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shannon</surname> <given-names>C. E.</given-names></name></person-group> (<year>1948</year>). <article-title>A mathematical theory of communication</article-title>. <source>Bell Syst. Tech. J.</source> <volume>27</volume>, <fpage>379</fpage>&#x02013;<lpage>423</lpage>. <pub-id pub-id-type="doi">10.1002/j.1538-7305.1948.tb01338.x</pub-id></citation>
</ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>W.</given-names></name> <name><surname>Abdullah</surname> <given-names>L. N.</given-names></name> <name><surname>Suhaiza Sulaiman</surname> <given-names>P.</given-names></name> <name><surname>Khalid</surname> <given-names>F.</given-names></name></person-group> (<year>2024</year>). <article-title>Meta-feature-based traffic accident risk prediction: a novel approach to forecasting severity and incidence</article-title>. <source>Vehicles</source> <volume>6</volume>, <fpage>728</fpage>&#x02013;<lpage>746</lpage>. <pub-id pub-id-type="doi">10.3390/vehicles6020034</pub-id><pub-id pub-id-type="pmid">28691578</pub-id></citation></ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>S.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Miao</surname> <given-names>H.</given-names></name> <name><surname>Cao</surname> <given-names>J.</given-names></name></person-group> (<year>2021</year>). <article-title>Traffic accident risk prediction via multi-view multi-task spatio-temporal networks</article-title>. <source>IEEE Trans. Knowl. Data Eng.</source> <volume>35</volume>, <fpage>12323</fpage>&#x02013;<lpage>12336</lpage>. <pub-id pub-id-type="doi">10.1109/TKDE.2021.3135621</pub-id></citation>
</ref>
<ref id="B37">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X. F.</given-names></name> <name><surname>Fu</surname> <given-names>X. S.</given-names></name> <name><surname>Ge</surname> <given-names>T.</given-names></name></person-group> (<year>2011</year>). <article-title>Driving risk evaluation model of freeway interchange entrance area</article-title>. <source>J. Traffic Transp. Eng.</source> <volume>11</volume>, <fpage>88</fpage>&#x02013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.19818/j.cnki.1671-1637.2011.05.014</pub-id></citation>
</ref>
<ref id="B38">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xiao</surname> <given-names>J.</given-names></name> <name><surname>Kulakowski</surname> <given-names>B. T.</given-names></name> <name><surname>El-Gindy</surname> <given-names>M.</given-names></name></person-group> (<year>2000</year>). <article-title>Prediction of risk of wet-pavement accidents: fuzzy logic model</article-title>. <source>Transp. Res. Rec.</source> <volume>1717</volume>, <fpage>28</fpage>&#x02013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.3141/1717-05</pub-id></citation>
</ref>
<ref id="B39">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>C. C.</given-names></name></person-group> (<year>2013</year>). <article-title>Real time crash risk prediction model on freeways under nasty weather conditions</article-title>. <source>J. Jilin University</source> <volume>1</volume>, <fpage>73</fpage>&#x02013;<lpage>78</lpage>. <pub-id pub-id-type="doi">10.13229/j.cnki.jdxbgxb2013.01.036</pub-id></citation>
</ref>
<ref id="B40">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>X. L.</given-names></name></person-group> (<year>2013</year>). <source>Study on the impact of asphalt pavement skid resistance on traffic safety</source> (Dissertation). <publisher-loc>Beijing</publisher-loc>: <publisher-name>Beijing University of Civil Engineering and Architecture</publisher-name>.</citation>
</ref>
<ref id="B41">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Yannis</surname> <given-names>G.</given-names></name> <name><surname>Dragomanovits</surname> <given-names>A.</given-names></name> <name><surname>Laiou</surname> <given-names>A.</given-names></name> <name><surname>La Torre</surname> <given-names>F.</given-names></name> <name><surname>Domenichini</surname> <given-names>L.</given-names></name> <name><surname>Richter</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>&#x0201C;Road traffic accident prediction modelling: a literature review,&#x0201D;</article-title> in <source>Proceedings of the Institution of Civil Engineers-Transport, Vol. 170, No. 5</source> (<publisher-name>Thomas Telford Ltd</publisher-name>), <fpage>245</fpage>&#x02013;<lpage>254</lpage>. <pub-id pub-id-type="doi">10.1680/jtran.16.00067</pub-id><pub-id pub-id-type="pmid">26962031</pub-id></citation></ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>L.</given-names></name> <name><surname>Du</surname> <given-names>B.</given-names></name> <name><surname>Hu</surname> <given-names>X.</given-names></name> <name><surname>Sun</surname> <given-names>L.</given-names></name> <name><surname>Han</surname> <given-names>L.</given-names></name> <name><surname>Lv</surname> <given-names>W.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Deep spatio-temporal graph convolutional network for traffic accident prediction</article-title>. <source>Neurocomputing</source> <volume>423</volume>, <fpage>135</fpage>&#x02013;<lpage>147</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2020.09.043</pub-id></citation></ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>S.</given-names></name> <name><surname>Khattak</surname> <given-names>A.</given-names></name> <name><surname>Matara</surname> <given-names>C. M.</given-names></name> <name><surname>Hussain</surname> <given-names>A.</given-names></name> <name><surname>Farooq</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>Hybrid feature selection-based machine learning classification system for the prediction of injury severity in single and multiple-vehicle accidents</article-title>. <source>PLoS One</source> <volume>17</volume>:<fpage>e0262941</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0262941</pub-id><pub-id pub-id-type="pmid">35108288</pub-id></citation></ref>
<ref id="B44">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Cheng</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>Q.</given-names></name> <name><surname>Zhu</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Deep learning-based prediction of traffic accidents risk for internet of vehicles</article-title>. <source>China Commun.</source> <volume>19</volume>, <fpage>214</fpage>&#x02013;<lpage>224</lpage>. <pub-id pub-id-type="doi">10.23919/JCC.2022.02.017</pub-id></citation>
</ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>H.</given-names></name> <name><surname>Yu</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>D.</given-names></name> <name><surname>Mao</surname> <given-names>T.</given-names></name> <name><surname>Zhu</surname> <given-names>H.</given-names></name></person-group> (<year>2019</year>). <article-title>Vehicle accident risk prediction based on AdaBoost-SO in VANETs</article-title>. <source>IEEE Access</source> <volume>7</volume>, <fpage>14549</fpage>&#x02013;<lpage>14557</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2019.2894176</pub-id><pub-id pub-id-type="pmid">26636576</pub-id></citation></ref>
<ref id="B46">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>S.</given-names></name> <name><surname>Cheng</surname> <given-names>P.</given-names></name> <name><surname>Schwebel</surname> <given-names>D. C.</given-names></name> <name><surname>Zhao</surname> <given-names>M.</given-names></name> <name><surname>Yang</surname> <given-names>L.</given-names></name> <name><surname>Xiao</surname> <given-names>W.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Characteristics of media-reported road traffic crashes related to new energy vehicles in China</article-title>. <source>J. Saf. Res.</source> <volume>92</volume>, <fpage>48</fpage>&#x02013;<lpage>54</lpage>. <pub-id pub-id-type="doi">10.1016/j.jsr.2024.11.012</pub-id><pub-id pub-id-type="pmid">39986866</pub-id></citation></ref>
</ref-list>
</back>
</article>