<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Environ. Sci.</journal-id>
<journal-title>Frontiers in Environmental Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Environ. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-665X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1522933</article-id>
<article-id pub-id-type="doi">10.3389/fenvs.2025.1522933</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Environmental Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Evacuation path optimization algorithm for grassland fires based on SAR imagery and intelligent optimization</article-title>
<alt-title alt-title-type="left-running-head">Zhang et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fenvs.2025.1522933">10.3389/fenvs.2025.1522933</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Ziyang</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Tan</surname>
<given-names>Lingye</given-names>
</name>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2823383/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tiong</surname>
<given-names>Robert L. K.</given-names>
</name>
<uri xlink:href="https://loop.frontiersin.org/people/1483997/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff>
<institution>School of Civil and Environmental Engineering</institution>, <institution>Nanyang Technological University</institution>, <addr-line>Singapore</addr-line>, <country>Singapore</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/991374/overview">Felipe Augusto Pereira De Figueiredo</ext-link>, National Institute of Telecommunications, Brazil</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2656138/overview">Maryam Rahnemoonfar</ext-link>, Lehigh University, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2139450/overview">Yaohui Liu</ext-link>, Shandong Jianzhu University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2604098/overview">Georgios Marios Karagiannis</ext-link>, International Coalition for Sustainable Infrastructure, United Kingdom</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Lingye Tan&#x2009;, <email>lingye001@e.ntu.edu.sg</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>18</day>
<month>03</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1522933</elocation-id>
<history>
<date date-type="received">
<day>13</day>
<month>11</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>24</day>
<month>02</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Zhang, Tan and Tiong.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Zhang, Tan and Tiong</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The acceleration of urbanization and the impact of climate change have led to an increasing frequency and intensity of grassland fires, posing severe challenges to resident safety and ecological protection. Traditional static evacuation route planning methods struggle to adapt in real-time to the dynamic changes in fire conditions during emergency management. To address this issue, this paper proposes a grassland fire evacuation route optimization strategy based on the GreyGNN-MARL model. By integrating Synthetic Aperture Radar (Sentinel-1 SAR) imagery, Graph Neural Networks (GNNs), Grey Wolf Optimization (GWO) algorithms, and Multi-Agent Reinforcement Learning (MARL), the model achieves intelligent planning and real-time adjustment of dynamic evacuation routes in fire scenarios. Experimental results demonstrate that this model significantly outperforms traditional methods in terms of evacuation time, risk avoidance success rate, and path safety, with evacuation time reduced by over 25% and risk avoidance success rate improved by approximately 18%. This model provides technical support for emergency management of grassland fires, helping to enhance evacuation efficiency and ensure safety, which is of great significance for smart cities and ecological protection. Future research will focus on further optimizing the model&#x2019;s computational efficiency and applicability for broader use in fire emergency management in complex environments.</p>
</abstract>
<kwd-group>
<kwd>fire evacuation route</kwd>
<kwd>SAR imagery</kwd>
<kwd>pathfinding optimization</kwd>
<kwd>deep learning</kwd>
<kwd>multi-hazard ecosystem resilience</kwd>
<kwd>post-fire recovery</kwd>
<kwd>climate-adaptive decision-making</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Big Data, AI, and the Environment</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>In recent years, the frequency and intensity of wildfires have increased significantly around the world, especially in the Mediterranean, North America, South America, and Australia (<xref ref-type="bibr" rid="B24">Nur et al., 2022</xref>; <xref ref-type="bibr" rid="B47">Zhang et al., 2025</xref>). This trend not only threatens human life and property, but also has a profound impact on ecosystem recovery and carbon cycling (<xref ref-type="bibr" rid="B10">Ghali and Akhloufi, 2023</xref>). Climate change and intensified human activities are the main factors leading to the frequent occurrence of wildfires, causing a large loss of forest resources and weakening the self-recovery capacity of ecosystems (<xref ref-type="bibr" rid="B48">Zhang et al., 2021</xref>). In this context, traditional fire evacuation path planning usually focuses on the rapid evacuation of people, but it faces challenges in simultaneously considering the long-term recovery needs of ecosystems. Post-fire vegetation recovery, maintenance of carbon storage, and enhancement of ecosystem resilience have become key topics in current wildfire research and emergency management (<xref ref-type="bibr" rid="B3">Ban et al., 2020</xref>; <xref ref-type="bibr" rid="B8">Florath and Keller, 2022</xref>; <xref ref-type="bibr" rid="B16">Huang et al., 2025</xref>).</p>
<p>Ecosystem resilience is particularly important in areas where fires frequently occur. After a fire, vegetation needs to be restored to a certain coverage level to achieve carbon storage and environmental restoration goals (<xref ref-type="bibr" rid="B34">Tian et al., 2022</xref>). However, in areas with frequent fires and extreme weather, vegetation restoration faces many challenges, making it difficult to stabilize the carbon cycle (<xref ref-type="bibr" rid="B22">Lee et al., 2020</xref>). Therefore, how to balance ecosystem restoration during fire evacuation while enhancing the system&#x2019;s carbon absorption and storage capacity has become a research direction that urgently needs to be solved (<xref ref-type="bibr" rid="B32">Sun et al., 2021</xref>). In this context, path optimization technology based on intelligent algorithms provides a new idea for solving the comprehensive needs of fire evacuation and ecosystem restoration (<xref ref-type="bibr" rid="B18">Jiang et al., 2021</xref>).</p>
<p>This study proposes a GreyGNN-MARL model, which integrates graph neural networks (GNNs), gray wolf optimization (GWO) and multi-agent reinforcement learning (MARL) technology to provide effective support for path planning and ecosystem restoration in fire-prone areas. GNNs can construct complex geographic structure information in fire scenes and generate network structures of buildings, roads and vegetation, thereby providing a data basis for path optimization (<xref ref-type="bibr" rid="B19">Karimzadeh et al., 2022</xref>). GWO simulates the hunting behavior of gray wolves and dynamically optimizes the weights and parameters in path planning, aiming to minimize evacuation time while maximizing safety (<xref ref-type="bibr" rid="B13">Hu et al., 2021</xref>). In addition, MARL trains multiple agents (such as emergency evacuees) to collaborate in a dynamic fire environment, thereby facilitating the identification of optimal evacuation paths and strategies.</p>
<p>The main contribution of this research are as follows:<list list-type="simple">
<list-item>
<p>&#x2022; The fusion of multi-source data, including Sentinel-1 SAR imagery, global fire carbon emissions, and vegetation indices, utilizing Graph Neural Networks (GNNs) to construct complex geographical structural information in fire scenarios, achieving a unified modeling of path optimization and ecosystem recovery.</p>
</list-item>
<list-item>
<p>&#x2022; The introduction of the Grey Wolf Optimization (GWO) algorithm to dynamically adjust evacuation path weights and parameters, minimizing evacuation time while maximizing safety, providing intelligent support for path decision-making in high-frequency fire environments.</p>
</list-item>
<list-item>
<p>&#x2022; The implementation of Multi-Agent Reinforcement Learning (MARL) to enable agents to collaborate in dynamic fire environments, ensuring that evacuation path optimization not only prioritizes crowd safety but also supports post-fire ecosystem recovery and carbon storage.</p>
</list-item>
</list>
</p>
<p>This model is not only applicable to grass fires, but can also be extended to other types of fire scenarios, such as bush fuel fires. Through the fusion of multi-source data, the model can adapt to the characteristics of fires of different fuel types and achieve more flexible and efficient evacuation path optimization. By optimizing the selection of evacuation paths, the GreyGNN-MARL model not only reduces the time for crowd evacuation, but also helps reduce damage to vegetation and the environment, thereby providing more favorable conditions for subsequent ecological restoration. By combining multi-source data, the model can identify high-risk areas for fires and provide scientific path planning support for vegetation restoration and carbon storage, striving to reduce the negative effects of fire on the environment through path optimization and promote the sustainable recovery of the ecosystem.</p>
</sec>
<sec id="s2">
<title>2 Related work</title>
<sec id="s2-1">
<title>2.1 Fire evacuation path optimization algorithms</title>
<p>Fire evacuation path optimization algorithms play a critical role in emergency management during fires, with the primary goal of providing the safest and most effective evacuation routes for people during a fire event, thereby minimizing loss of life and property. Traditional path optimization methods typically rely on Geographic Information Systems (GIS) and classic graph-based algorithms, such as Dijkstra&#x2019;s and A&#x2a; algorithms, which can efficiently find the shortest paths in static environments (<xref ref-type="bibr" rid="B7">Chen et al., 2020</xref>; <xref ref-type="bibr" rid="B38">Wang et al., 2025a</xref>). However, these methods struggle to adapt to the real-time requirements of path safety and responsiveness in the rapidly changing conditions of a fire disaster, leading to limited practical application effectiveness (<xref ref-type="bibr" rid="B20">Kodipalli et al., 2023</xref>).</p>
<p>In recent years, with the advancement of deep learning and intelligent optimization algorithms, fire evacuation path optimization has gradually incorporated data-driven and intelligent optimization approaches to address the complexities of dynamic fire scenarios (<xref ref-type="bibr" rid="B30">Sharma et al., 2020</xref>; <xref ref-type="bibr" rid="B37">Wang et al., 2025b</xref>). Graph Neural Networks (GNNs) have emerged as a valuable tool in disaster management due to their advantages in processing graph-structured data. They can model complex geographical environments as graph structures and analyze the risks and fire spread in different areas, thus providing support for dynamic path planning (<xref ref-type="bibr" rid="B28">Salami et al., 2023</xref>). Meanwhile, intelligent optimization algorithms, such as Particle Swarm Optimization (PSO) and Ant Colony Optimization (ACO), exhibit strong global search capabilities in path optimization, enabling the identification of safe routes in risk environments created by fire spread (<xref ref-type="bibr" rid="B5">Bouguettaya et al., 2022</xref>). Nevertheless, relying solely on deep learning or optimization algorithms still presents limitations in practical fire evacuation path optimization, primarily due to a lack of dynamic updating mechanisms that can effectively respond to the rapid expansion of fire.</p>
<p>Furthermore, to enhance the intelligence and real-time capabilities of path planning, this paper primarily explores the application of Multi-Agent Reinforcement Learning (MARL) in evacuation path optimization. By simulating various evacuation strategies through the collaboration of multiple agents in dynamic environments, the model can dynamically adjust path planning to adapt to the rapid changes in fire conditions.</p>
</sec>
<sec id="s2-2">
<title>2.2 Application of SAR images in disaster management</title>
<p>In disaster management, Synthetic Aperture Radar (SAR) imagery has become an essential tool for monitoring natural disasters due to its all-weather, all-hour observation capabilities. SAR imagery can penetrate clouds and smoke, providing high-resolution surface information suitable for real-time monitoring of various disaster scenarios, including floods, earthquakes, and wildfires. Particularly in wildfire management, SAR imagery can clearly capture the areas affected by fires, the direction and rate of spread, offering robust data support for comprehensive monitoring and assessment of fire situations (<xref ref-type="bibr" rid="B12">Gupta et al., 2021</xref>; <xref ref-type="bibr" rid="B35">Tlijani et al., 2023</xref>). Traditional disaster management methods rely on ground sensors and video surveillance, which are limited in their application to large-scale fire scenarios and struggle to cover distant or dense fire areas. In contrast, SAR imagery not only provides real-time observations over a broader range but also acquires high-precision surface information, such as the location of fire sources, fire boundaries, vegetation density, and other critical features (<xref ref-type="bibr" rid="B19">Karimzadeh et al., 2022</xref>; <xref ref-type="bibr" rid="B31">Subramanian et al., 2023</xref>). By processing this SAR data, researchers can rapidly analyze fire dynamics after an outbreak, providing an accurate information foundation for disaster emergency decision-making (As shown in <xref ref-type="fig" rid="F1">Figure 1</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Schematic diagram of the application of SAR imagery in fire emergency management (based on multi-platform applications in related research). Different SAR platforms used in traditional fire monitoring research, including satellite and aerial platforms. Please note that the SAR data used in this study came from the Sentinel-1 satellite platform, not the aerial platform.</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g001.tif"/>
</fig>
<p>In recent years, with the advancement of deep learning and intelligent analysis technologies, the accuracy and efficiency of SAR image processing have been greatly enhanced. Leveraging deep learning models such as Graph Neural Networks (GNN) and Convolutional Neural Networks (CNN), SAR imagery can be transformed into visual charts of fire situations, thereby supporting dynamic modeling of disaster scenarios (<xref ref-type="bibr" rid="B26">Pi et al., 2020</xref>; <xref ref-type="bibr" rid="B39">Wang and Wang, 2024</xref>; <xref ref-type="bibr" rid="B45">Yu and Zhenhua, 2024</xref>). However, many current studies still focus on the application of SAR imagery in disaster detection and monitoring, with less exploration of its potential in disaster evacuation path optimization. Although SAR imagery can provide precise information on fire spread, integrating it effectively into real-time decision-making for path planning remains an underexplored technical challenge (<xref ref-type="bibr" rid="B2">Alsamhi et al., 2021</xref>). Therefore, fully leveraging the data support role of SAR imagery in disaster management and combining it with evacuation path optimization models is an important direction for enhancing the speed and quality of wildfire emergency response and decision-making.</p>
</sec>
<sec id="s2-3">
<title>2.3 Application of hybrid optimization algorithms in path planning</title>
<p>In the field of path planning, hybrid optimization algorithms have gradually become an effective tool for path planning in complex environments due to their combination of global search and local optimization capabilities. These algorithms typically integrate various optimization methods, such as Particle Swarm Optimization (PSO), Ant Colony Optimization (ACO), and Genetic Algorithms (GA), and leverage machine learning models to enhance the adaptability and efficiency of the algorithms (<xref ref-type="bibr" rid="B14">Hu X. et al., 2023</xref>). By combining the strengths of different algorithms, hybrid optimization algorithms excel in multi-objective optimization, making them particularly suitable for dynamic path planning in complex disaster scenarios. In wildfire scenarios, path planning must consider not only conventional factors such as path length and time but also the potential threats of fire spread to the routes in real-time. Traditional path planning algorithms (like A&#x2a;, Dijkstra) can find the optimal path in static environments but struggle to cope with the real-time changes in fire conditions (<xref ref-type="bibr" rid="B42">Xu et al., 2022</xref>). To address this issue, researchers have begun to introduce hybrid optimization algorithms to improve the flexibility of path planning. These methods dynamically adjust the weight coefficients and sampling strategies in path selection, enabling the generation of safer and more stable evacuation routes in complex fire environments.</p>
<p>Furthermore, with the development of Multi-Agent Reinforcement Learning (MARL) technology, hybrid optimization algorithms have been increasingly applied to multi-agent collaborative path planning. MARL&#x2019;s application in fire scenarios can simulate the cooperation of multiple evacuation teams, adjusting routes in real-time to avoid collisions and adapt to the dynamic changes in fire conditions (<xref ref-type="bibr" rid="B43">Yang et al., 2022</xref>). However, although the combination of hybrid optimization algorithms and MARL can enhance the flexibility and dynamic adaptability of path planning, most existing studies focus on the theoretical aspects of the algorithms, lacking practical application explorations supported by multi-source data (<xref ref-type="bibr" rid="B27">Poudel and Moh, 2021</xref>). How to effectively integrate hybrid optimization algorithms with fire data (such as SAR imagery, fire emission data) to meet the path planning needs in wildfires remains a significant technical challenge.</p>
</sec>
</sec>
<sec sec-type="methods" id="s3">
<title>3 Methods</title>
<sec id="s3-1">
<title>3.1 Overall model framework</title>
<p>This study proposes the GreyGNN-MARL model, which aims to provide an intelligent solution for evacuation path optimization in grassland fire scenarios. The core goal of the model is to achieve real-time planning and adjustment of dynamic evacuation paths under fire environments by combining multi-source data with intelligent algorithms. The GreyGNN-MARL model consists of multiple modules, mainly including graph neural networks (GNN) modules, gray wolf optimization (GWO) modules, and multi-agent reinforcement learning (MARL) modules. Through the collaborative work of these modules, the model can optimize evacuation paths in real time in complex and dynamic fire environments. <xref ref-type="fig" rid="F2">Figure 2</xref> shows the overall architecture of the GreyGNN-MARL model, covering the complete process from multi-source data input to path planning output.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Overall structure of the GreyGNN-MARL model.</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g002.tif"/>
</fig>
<p>At the input layer of the model, GreyGNN-MARL combines multi-source data from Sentinel-1 SAR images, global fire emission data (GFED), vegetation index, etc., and structures the fire scene through data preprocessing. These data are processed by GNNs, where each path (track1, track2, track3) represents a different data processing flow. GNNs and SAR encoders are used to extract geographic and fire information from multi-source data to form a graph structure of the fire scene. In this process, nodes represent different geographical locations or evacuation areas, while edges represent the connection between nodes based on risk propagation or traffic accessibility. Through this graph structure, the model can dynamically capture the spread of fire and regional fire risk information.</p>
<p>After the graph structure is constructed, the model enters the GWO module, which performs preliminary optimization of the path based on the graph feature matrix of GNN. The GWO algorithm simulates the hunting strategy of gray wolf groups and uses adaptive sampling density to dynamically adjust the weights in path selection to generate multiple candidate evacuation paths. Compared with traditional path planning methods, the GWO module can prioritize avoiding high-risk areas and improve the safety and efficiency of path selection.</p>
<p>Then, the MARL module further optimizes the evacuation path through multi-agent collaboration. In a fire environment, the MARL module uses multiple agents to adjust the evacuation strategy in real time to cope with the dynamic changes caused by the spread of fire. Each agent represents an evacuation team, which ensures that each group of evacuees can avoid high-risk areas and adjust the evacuation path in real time by sharing information and collaborating. In a complex environment where the fire is dynamically expanding, the MARL module can continuously optimize the path to ensure that the evacuation process is more adaptable and intelligent.</p>
<p>Through the organic combination of GNN, GWO and MARL modules, the model forms a multi-level intelligent evacuation path optimization system that can dynamically optimize the path in a fire environment and improve the safety, real-time and adaptability of the evacuation path.</p>
</sec>
<sec id="s3-2">
<title>3.2 Graph neural networks module</title>
<p>The Graph Neural Network (GNN) module is the core component of the GreyGNN-MARL model used for constructing and analyzing the fire environment. Its main task is to convert fire scenes into graph structure representations based on multi-source data (such as SAR images, fire emission data, and vegetation indexes) to capture fire spread and regional risks at the node and edge levels. Through the GNN module, the model can effectively extract and process spatial and risk information in the fire environment, providing accurate fire risk and regional information support for the path optimization module (<xref ref-type="bibr" rid="B6">Chae et al., 2022</xref>; <xref ref-type="bibr" rid="B29">Sannidhan et al., 2023</xref>; <xref ref-type="bibr" rid="B40">Wang et al., 2022</xref>). As shown in <xref ref-type="fig" rid="F3">Figure 3</xref>, the architecture of the GNN module includes data preprocessing, feature initialization of nodes and edges, message passing, and aggregation steps.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>GNN module architecture and workflow. Nodes &#x201c;A&#x201d; and &#x201c;B&#x201d; represent different geographical locations and evacuation areas. Node features include geographical location, fire risk, vegetation cover, etc. Edges represent the connection between nodes, and weights reflect fire risk or traffic capacity.</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g003.tif"/>
</fig>
<p>Initially, the GNN module converts key geographical information and fire status in the fire scenario into a graph structure <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>G</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>V</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>V</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> represents the set of nodes, indicating different geographical locations or evacuation areas, and <inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> represents the set of edges, connecting different nodes through travel or risk relationships. The initial features <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> of each node <inline-formula id="inf5">
<mml:math id="m5">
<mml:mrow>
<mml:mi>v</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>V</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> are initialized using the following formula:<disp-formula id="equ1">
<mml:math id="m6">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>MLP</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>Embedding</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>Risk</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:mtext>Vegetation</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf6">
<mml:math id="m7">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the geographical feature of the node, <inline-formula id="inf7">
<mml:math id="m8">
<mml:mrow>
<mml:mtext>Risk</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> denotes the fire risk level of the node, and <inline-formula id="inf8">
<mml:math id="m9">
<mml:mrow>
<mml:mtext>Vegetation</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> indicates the vegetation coverage. Through a multi-layer perceptron (MLP) and embedding layer, the GNN module transforms this information into an initial node feature vector suitable for message passing.</p>
<p>During the message passing phase, the GNN module propagates and aggregates fire and risk information through edges between each node, constructing dynamic features of the fire scenario. In the <inline-formula id="inf9">
<mml:math id="m10">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-th layer of message passing, the feature vector <inline-formula id="inf10">
<mml:math id="m11">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> of node <inline-formula id="inf11">
<mml:math id="m12">
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is updated by the weighted aggregation of neighbor node features, with the formula being:<disp-formula id="equ2">
<mml:math id="m13">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3c3;</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:munder>
</mml:mstyle>
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:msubsup>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>u</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf12">
<mml:math id="m14">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf13">
<mml:math id="m15">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> are the weight matrices for nodes and edges, respectively, <inline-formula id="inf14">
<mml:math id="m16">
<mml:mrow>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> denotes the set of neighboring nodes of node <inline-formula id="inf15">
<mml:math id="m17">
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf16">
<mml:math id="m18">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is the attention weight for edge <inline-formula id="inf17">
<mml:math id="m19">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, measuring the influence of node <inline-formula id="inf18">
<mml:math id="m20">
<mml:mrow>
<mml:mi>u</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> on node <inline-formula id="inf19">
<mml:math id="m21">
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf20">
<mml:math id="m22">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the activation function.</p>
<p>To further enhance the accuracy of risk propagation in fire scenarios, the GNN module introduces an attention mechanism in message passing to dynamically adjust the weights <inline-formula id="inf21">
<mml:math id="m23">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> of edges, prioritizing the influence of high-risk nodes during fire spread. The attention weights <inline-formula id="inf22">
<mml:math id="m24">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> are calculated using the following formula:<disp-formula id="equ3">
<mml:math id="m25">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>LeakyReLU</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x22a4;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mfenced open="[" close="]">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>u</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mo stretchy="false">&#x2016;</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msup>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2061;</mml:mo>
<mml:mi>exp</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>LeakyReLU</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x22a4;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mfenced open="[" close="]">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mo stretchy="false">&#x2016;</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msup>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf23">
<mml:math id="m26">
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the learned attention parameter vector, <inline-formula id="inf24">
<mml:math id="m27">
<mml:mrow>
<mml:mo stretchy="false">&#x2016;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> represents vector concatenation, and LeakyReLU is the activation function. This mechanism adaptively focuses on key nodes and high-risk edges in the fire scenario, ensuring more precise fire risk assessment during path optimization.</p>
<p>After multiple layers of message passing and feature aggregation, the GNN module outputs the final node features <inline-formula id="inf25">
<mml:math id="m28">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and edge feature matrices, reflecting the risk levels of various regions and their connectivity in the current fire scenario. The resulting graph structure information <inline-formula id="inf26">
<mml:math id="m29">
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is then input into the Grey Wolf Optimization (GWO) module to support further path planning and optimization.</p>
<p>The GNN module forms a high-dimensional feature representation of the fire scenario through multi-layer feature aggregation, dynamic adjustment of attention weights (<xref ref-type="bibr" rid="B9">Ge et al., 2022</xref>), and embedding of fire risks. This module not only effectively captures the spatial relationships in the fire environment but also dynamically models the fire spread process, laying a solid data foundation for real-time path planning in the GreyGNN-MARL model.</p>
</sec>
<sec id="s3-3">
<title>3.3 Grey wolf optimizer module</title>
<p>The Grey Wolf Optimizer (GWO) module in the GreyGNN-MARL model is responsible for generating preliminary path optimization in fire scenarios. Inspired by the hunting behavior of grey wolves, the GWO algorithm dynamically adjusts path sampling density and weight coefficients to provide global search and optimization capabilities for evacuation routes (<xref ref-type="bibr" rid="B33">Sun et al., 2024</xref>; <xref ref-type="bibr" rid="B41">Wei et al., 2024</xref>; <xref ref-type="bibr" rid="B1">Agarwal et al., 2023</xref>). In fire environments, the GWO module utilizes the graph feature matrix generated by the Graph Neural Network (GNN) to preliminarily plan multiple candidate paths, ensuring that evacuation routes can avoid high-risk areas as much as possible. As shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, the GWO module includes key steps such as path initialization, dynamic sampling, and iterative optimization.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Gwo model structure diagram.</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g004.tif"/>
</fig>
<p>The GWO module initializes three main search agents: the alpha wolf (Alpha), beta wolf (Beta), and delta wolf (Delta), each playing different roles in path optimization. The positions of these three agents represent the coordinates of candidate evacuation routes, with the initialization formula as follows:<disp-formula id="equ4">
<mml:math id="m30">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>Initialize</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>start</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>goal</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:mspace width="1em"/>
<mml:msubsup>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3b2;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>RandomInit</mml:mtext>
<mml:mfenced open="(" close=")">
</mml:mfenced>
<mml:mo>()</mml:mo>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3b4;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>RandomInit</mml:mtext>
<mml:mo>()</mml:mo>
<mml:mfenced open="(" close=")">
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf27">
<mml:math id="m31">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> represents the initial position of the alpha wolf, initializing the path through the start and goal points, while <inline-formula id="inf28">
<mml:math id="m32">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3b2;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf29">
<mml:math id="m33">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3b4;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> are the random initial positions for the beta and delta wolves, respectively. This initialization ensures that the path search process can begin with multiple candidate paths, increasing path diversity.</p>
<p>During the path optimization process, the GWO module improves the evacuation route&#x2019;s risk avoidance effect by dynamically adjusting the sampling density. Specifically, the alpha, beta, and delta wolves repeatedly calculate the distances between each other to update their respective path positions. The path update formula for the <inline-formula id="inf30">
<mml:math id="m34">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-th iteration is as follows:<disp-formula id="equ5">
<mml:math id="m35">
<mml:mrow>
<mml:mi>X</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>A</mml:mi>
<mml:mo>&#x22c5;</mml:mo>
<mml:mfenced open="|" close="|">
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:mo>&#x22c5;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>X</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf31">
<mml:math id="m36">
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf32">
<mml:math id="m37">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> are control coefficients that adjust the convergence and exploration capabilities of the path. The coefficient <inline-formula id="inf33">
<mml:math id="m38">
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is dynamically calculated using the following formula:<disp-formula id="equ6">
<mml:math id="m39">
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x22c5;</mml:mo>
<mml:mi>a</mml:mi>
<mml:mo>&#x22c5;</mml:mo>
<mml:mi>r</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>a</mml:mi>
<mml:mo>,</mml:mo>
<mml:mspace width="1em"/>
<mml:mi>a</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf34">
<mml:math id="m40">
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the maximum number of iterations, and <inline-formula id="inf35">
<mml:math id="m41">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is a random number controlling the dynamic changes in sampling density and search range. By continuously adjusting the values of <inline-formula id="inf36">
<mml:math id="m42">
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf37">
<mml:math id="m43">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, the GWO module can increase sampling in high-risk areas, thereby avoiding areas with strong fire spread and enhancing the safety of the path.</p>
<p>Additionally, to ensure the stability of the optimization process and the global nature of path selection, the GWO module comprehensively evaluates the path distances between the alpha, beta, and delta wolves in each iteration. The comprehensive path evaluation formula is as follows:<disp-formula id="equ7">
<mml:math id="m44">
<mml:mrow>
<mml:mtext>Fitness</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22c5;</mml:mo>
<mml:mtext>Distance</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22c5;</mml:mo>
<mml:mtext>Risk</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22c5;</mml:mo>
<mml:mtext>Smoothness</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf38">
<mml:math id="m45">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf39">
<mml:math id="m46">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf40">
<mml:math id="m47">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are weight coefficients that control the proportion of path distance, fire risk, and path smoothness in the optimization. Through this formula, the GWO module can balance path length and risk avoidance, achieving multi-objective path optimization.</p>
<p>After multiple iterations and dynamic sampling, the GWO module generates a set of optimized candidate paths, with the selected paths having high safety and shorter evacuation times. These paths will serve as the initial path input for the Multi-Agent Reinforcement Learning (MARL) module, further supporting dynamic adjustment and real-time optimization of the paths. The GWO module provides an efficient preliminary path optimization method for the GreyGNN-MARL model through adaptive path sampling and multi-objective optimization strategies.</p>
</sec>
<sec id="s3-4">
<title>3.4 Multi-agent reinforcement learning module</title>
<p>Multi-Agent Reinforcement Learning (MARL) extends traditional reinforcement learning to environments where multiple agents interact. Each agent learns to optimize its strategy by receiving feedback from the environment while considering the presence and actions of other agents. In MARL, agents operate in a shared environment, learning to cooperate or compete to achieve individual or collective goals. Each agent simulates an &#x201c;evacuation team,&#x201d; which refers to a group of individuals who need to evacuate urgently during a fire, usually residents walking, residents riding bicycles, or families driving small vehicles (such as cars). We assume that these evacuation teams are small in size to allow for more flexible route adjustments and avoidance of high-risk areas for fires. Larger-scale transportation vehicles (such as buses) and large-scale team evacuations are not within the scope of this study&#x2019;s assumptions. The model focuses on the rapid evacuation of small-scale teams. As shown in <xref ref-type="fig" rid="F5">Figure 5</xref>, the MARL module includes the state space definition of the agent, the reward function design, and the policy update process.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Structural diagram of the GWO algorithm.</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g005.tif"/>
</fig>
<p>In the MARL module, the state <inline-formula id="inf41">
<mml:math id="m48">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> of each agent is composed of characteristics such as its position, fire risk information, and distances to neighboring agents, with the state defined by the following formula (<xref ref-type="bibr" rid="B46">Zhang et al., 2022</xref>):<disp-formula id="equ8">
<mml:math id="m49">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfenced open="[" close="]">
<mml:mrow>
<mml:mtext>Position</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:mtext>&#x2009;Risk</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi mathvariant="script">N</mml:mi>
</mml:mrow>
</mml:munder>
</mml:mstyle>
<mml:mtext>Distance</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf42">
<mml:math id="m50">
<mml:mrow>
<mml:mtext>Position</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the coordinate of the agent&#x2019;s current position, <inline-formula id="inf43">
<mml:math id="m51">
<mml:mrow>
<mml:mtext>Risk</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the fire risk coefficient at the current position, and <inline-formula id="inf44">
<mml:math id="m52">
<mml:mrow>
<mml:mi mathvariant="script">N</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> denotes the set of neighboring agents. This state description allows agents to perceive changes in the surrounding fire and distances to neighbors in the dynamic environment, supporting path optimization.</p>
<p>Each agent selects an evacuation path by performing an action <inline-formula id="inf45">
<mml:math id="m53">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. The set of actions includes basic operations such as moving forward, turning, and waiting, and agents choose action <inline-formula id="inf46">
<mml:math id="m54">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> based on the current state <inline-formula id="inf47">
<mml:math id="m55">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> to avoid high-risk areas. The agents&#x2019; decisions follow a reinforcement learning-based policy update formula:<disp-formula id="equ9">
<mml:math id="m56">
<mml:mrow>
<mml:mi>Q</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2190;</mml:mo>
<mml:mi>Q</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mfenced open="[" close="]">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3b3;</mml:mi>
<mml:munder>
<mml:mrow>
<mml:mi>max</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munder>
<mml:mi>Q</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>Q</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf48">
<mml:math id="m57">
<mml:mrow>
<mml:mi>Q</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> represents the state-action value function, <inline-formula id="inf49">
<mml:math id="m58">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the learning rate, <inline-formula id="inf50">
<mml:math id="m59">
<mml:mrow>
<mml:mi>&#x3b3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the discount factor, and <inline-formula id="inf51">
<mml:math id="m60">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the immediate reward obtained by the agent at time <inline-formula id="inf52">
<mml:math id="m61">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>. This update formula allows agents to balance exploration and exploitation, gradually learning the optimal strategy to avoid high-risk areas.</p>
<p>To achieve efficient risk avoidance, the MARL module designs a comprehensive reward function that considers factors such as path safety, evacuation time, and distances between agents. The reward function is defined as:<disp-formula id="equ10">
<mml:math id="m62">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22c5;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>Risk</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22c5;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>Time</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22c5;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi mathvariant="script">N</mml:mi>
</mml:mrow>
</mml:munder>
</mml:mstyle>
<mml:mtext>Distance</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf53">
<mml:math id="m63">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf54">
<mml:math id="m64">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf55">
<mml:math id="m65">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are weight coefficients controlling the influence of risk avoidance, time minimization, and agent spacing in the reward. This reward mechanism provides agents with immediate feedback during the evacuation process, leading to the selection of efficient risk-avoiding paths.</p>
<p>During the training process of the MARL module, the model gradually optimizes path selection through the collaboration of multiple agents, enabling them to achieve dynamic path planning under changing fire conditions and uncertainties. Information sharing and state synchronization among agents also ensure global consistency in evacuation routes (<xref ref-type="bibr" rid="B36">&#xdc;nal et al., 2022</xref>; <xref ref-type="bibr" rid="B15">Hu Y. et al., 2023</xref>). To further optimize the strategy, agents update their decision policy using the following policy iteration formula:<disp-formula id="equ11">
<mml:math id="m66">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3c0;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>a</mml:mi>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:mi>s</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>Q</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>a</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>/</mml:mo>
<mml:mi>&#x3c4;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>A</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2061;</mml:mo>
<mml:mi>exp</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>Q</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>/</mml:mo>
<mml:mi>&#x3c4;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf56">
<mml:math id="m67">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3c0;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>a</mml:mi>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> represents the policy probability distribution, and <inline-formula id="inf57">
<mml:math id="m68">
<mml:mrow>
<mml:mi>&#x3c4;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the temperature coefficient controlling the level of exploration. By soft-maximizing the <inline-formula id="inf58">
<mml:math id="m69">
<mml:mrow>
<mml:mi>Q</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-values, agents can explore a broader range of path choices while favoring the optimal strategy with higher <inline-formula id="inf59">
<mml:math id="m70">
<mml:mrow>
<mml:mi>Q</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-values.</p>
<p>In summary, the MARL module enables the GreyGNN-MARL model to achieve intelligent evacuation route optimization in dynamic fire environments through collaborative learning and real-time decision-making among multiple agents, providing reliable technical support for real-time risk avoidance in complex disaster scenarios.</p>
</sec>
</sec>
<sec id="s4">
<title>4 Experiment</title>
<sec id="s4-1">
<title>4.1 Datasets</title>
<p>To ensure the practical application effectiveness of the GreyGNN-MARL model in grassland fire scenarios, this study selected high-quality public datasets that are multi-sourced and multi-dimensional, including the Sentinel-1 SAR dataset, the Global Fire Emissions Database (GFED), and the NASA LP DAAC vegetation index dataset. These datasets provide comprehensive fire scenario information, covering the geographical structure of the fire area, the spread trend of the fire, and the vegetation coverage, providing ample data support for path optimization in dynamic fire environments. <xref ref-type="table" rid="T1">Table 1</xref> shows an overview of the datasets and their application scenarios.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Summary of experimental datasets.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Dataset</th>
<th align="left">Data content</th>
<th align="left">Application scenarios</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Sentinel-1 SAR</td>
<td align="left">SAR imagery, including geographical information and fire source location of the fire area</td>
<td align="left">Capturing surface features, generating base graph structure of the fire area</td>
</tr>
<tr>
<td align="left">GFED</td>
<td align="left">Fire carbon emissions, fire intensity, and trend of change</td>
<td align="left">Labeling fire risk areas, dynamically simulating the spread of the fire</td>
</tr>
<tr>
<td align="left">NASA LP DAAC</td>
<td align="left">Vegetation indices (NDVI, EVI), vegetation density</td>
<td align="left">Assessing the impact of ecological characteristics on fire spread, assisting in constructing fire risk maps</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The Sentinel-1 SAR dataset provides all-weather, all-hour synthetic aperture radar imagery. SAR imagery can penetrate clouds and smoke, accurately acquiring the location of the fire source, fire boundaries, and surface features during the fire (<xref ref-type="bibr" rid="B21">Lasaponara et al., 2023</xref>). This information is used to generate the base graph structure of the fire area, helping the GNN module capture geographical features and fire dynamics in the fire scenario, providing high-precision input for environmental modeling in path planning.</p>
<p>The Global Fire Emissions Database (GFED) provides data on carbon emissions, fire intensity, and spread trends during the fire. GFED data reflects the activity of the fire source and the type of combustion during the fire occurrence period, which helps to label high-risk areas and dynamically simulate the expansion of the fire (<xref ref-type="bibr" rid="B25">Oliva et al., 2020</xref>). The model uses GFED data for real-time updates of risk areas, ensuring that evacuation routes avoid high-risk areas of fire spread, enhancing the safety of the evacuation process.</p>
<p>The NASA LP DAAC Vegetation Index dataset provides vegetation indices (such as NDVI and EVI) for grassland areas, as well as ecological characteristics such as vegetation coverage and density (<xref ref-type="bibr" rid="B17">Huot et al., 2022</xref>). In fire scenarios, vegetation density and type directly affect the speed of fire spread and the level of fire risk. Through vegetation data, the GNN module can model the fire scenario accurately, further enhancing the support for risk avoidance strategies in path planning. Evacuation routes, and enhanced evacuation efficiency and safety.</p>
</sec>
<sec id="s4-2">
<title>4.2 Experimental setup</title>
<p>The experiment was conducted in a high-performance computing environment to support large-scale data processing and efficient training of multi-module deep learning models. The hardware and software configurations and model parameter settings are shown in <xref ref-type="table" rid="T2">Table 2</xref> covering detailed configurations of hardware devices, software platforms, key hyperparameters, and model modules.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Experimental environment and model parameter settings.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Setting</th>
<th align="left">Configuration</th>
<th align="left">Details</th>
<th align="left">Setting</th>
<th align="left">Configuration</th>
<th align="left">Details</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="4" align="left">Hardware</td>
<td align="left">Processor</td>
<td align="left">2.4&#xa0;GHz, 28 cores</td>
<td rowspan="4" align="left">Software</td>
<td align="left">Operating System</td>
<td align="left">Ubuntu 18.04</td>
</tr>
<tr>
<td align="left">GPU</td>
<td align="left">NVIDIA Tesla V100, 32&#xa0;GB memory</td>
<td align="left">Deep Learning Framework</td>
<td align="left">PyTorch 1.8.1</td>
</tr>
<tr>
<td align="left">Memory</td>
<td align="left">128&#xa0;GB</td>
<td align="left">Graph Neural Network Library</td>
<td align="left">DGL 0.6.1</td>
</tr>
<tr>
<td align="left">Storage</td>
<td align="left">2&#xa0;TB SSD</td>
<td align="left">Data Processing Library</td>
<td align="left">NumPy 1.19, Pandas 1.1</td>
</tr>
<tr>
<td rowspan="5" align="left">Hyperparameters</td>
<td align="left">Learning Rate</td>
<td align="left">0.001</td>
<td rowspan="5" align="left">Configuration</td>
<td align="left">GNN Layers</td>
<td align="left">3 graph convolutional layers</td>
</tr>
<tr>
<td align="left">Batch Size</td>
<td align="left">64</td>
<td align="left">GWO Population Size</td>
<td align="left">30 grey wolves</td>
</tr>
<tr>
<td align="left">Maximum Number of Iterations</td>
<td align="left">500</td>
<td align="left">Number of MARL Agents</td>
<td align="left">5</td>
</tr>
<tr>
<td align="left">Discount Factor (MARL)</td>
<td align="left">0.95</td>
<td align="left">GNN Node Feature Dimension</td>
<td align="left">256 dimensions</td>
</tr>
<tr>
<td align="left">Number of Attention Heads (GNN)</td>
<td align="left">8</td>
<td align="left">MARL Policy Update Frequency</td>
<td align="left">Update every 5 steps</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4-3">
<title>4.3 Evaluation metrics</title>
<p>To comprehensively evaluate the performance of the GreyGNN-MARL model in fire evacuation route optimization, this study designed multiple experimental metrics, including route planning time, risk avoidance success rate, route safety, route smoothness, and communication delay. These metrics quantitatively assess the model&#x2019;s performance from aspects of efficiency, safety, and stability, ensuring its reliability and application value in actual fire scenarios.</p>
<p>Route planning time refers to the average time required for the model to generate evacuation routes, calculated in seconds, used to measure the model&#x2019;s response efficiency.<disp-formula id="equ12">
<mml:math id="m71">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>avg</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf60">
<mml:math id="m72">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the time for the <inline-formula id="inf61">
<mml:math id="m73">
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-th planning, and <inline-formula id="inf62">
<mml:math id="m74">
<mml:mrow>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the total number of plannings. The shorter the route planning time, the faster the model&#x2019;s response speed, the better it meets the real-time evacuation needs in fire scenarios.</p>
<p>Risk avoidance success rate refers to the frequency at which the model successfully avoids high-risk areas in the fire environment, expressed as a percentage, used to evaluate the safety of route planning.<disp-formula id="equ13">
<mml:math id="m75">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>safe</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>safe</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>100</mml:mn>
<mml:mi>%</mml:mi>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf63">
<mml:math id="m76">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>safe</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the number of successful risk avoidances, and <inline-formula id="inf64">
<mml:math id="m77">
<mml:mrow>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the total number of tests. A higher risk avoidance success rate means the model has a higher adaptability to changes in the fire, effectively avoiding high-risk areas.</p>
<p>Route safety assesses the cumulative fire risk in the evacuation route, calculated using the fire risk weight <inline-formula id="inf65">
<mml:math id="m78">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>risk</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and the risk values <inline-formula id="inf66">
<mml:math id="m79">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> of each node on the route:<disp-formula id="equ14">
<mml:math id="m80">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>path</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>risk</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22c5;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf67">
<mml:math id="m81">
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the total length of the route. The lower the route safety, the more successful the route planning in avoiding high-risk areas, enhancing the safety of evacuation.</p>
<p>Route smoothness is used to measure the continuity and smoothness of the route, calculated by the angle changes between segments in the route:<disp-formula id="equ15">
<mml:math id="m82">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>smooth</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:mfenced open="|" close="|">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf68">
<mml:math id="m83">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the angle of the <inline-formula id="inf69">
<mml:math id="m84">
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-th segment of the route. A smaller smoothness value indicates a more continuous and smooth route, reducing the number of emergency turns, which helps to improve the speed and safety of evacuation.</p>
<p>Communication delay refers to the delay time of the system in receiving and processing multi-source data, used to evaluate real-time responsiveness in IoT environments:<disp-formula id="equ16">
<mml:math id="m85">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>D</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>comm</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:msub>
<mml:mrow>
<mml:mi>d</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf70">
<mml:math id="m86">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>d</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the delay of the <inline-formula id="inf71">
<mml:math id="m87">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-th data transmission, and <inline-formula id="inf72">
<mml:math id="m88">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the total number of transmissions. The lower the communication delay, the faster the model can obtain environmental information and adjust the route, helping to achieve efficient evacuation planning in fire environments.</p>
<p>These experimental metrics cover the model&#x2019;s response speed, the safety and smoothness of the route, and communication efficiency, ensuring the GreyGNN-MARL model has comprehensive performance in fire evacuation route optimization.</p>
</sec>
<sec id="s4-4">
<title>4.4 Results analysis and discussion</title>
<sec id="s4-4-1">
<title>4.4.1 Parameter tuning results</title>
<p>In this experiment, <xref ref-type="fig" rid="F6">Figure 6</xref> illustrates the performance of the GreyGNN-MARL model under different parameter settings, including the impact of learning rate and discount factor on model training outcomes.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Effect of different learning rates and discount factors on the training results of the GreyGNN-MARL model. <bold>(a)</bold> shows the change in the number of steps (steps per episode) that the agent performs in each session as the number of training sessions increases at different learning rates (0.001,0.01, and 0.1). <bold>(b)</bold> shows the training performance of the agents under different discount factors (0.99,0.999 and 1).</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g006.tif"/>
</fig>
<p>As shown in <xref ref-type="fig" rid="F6">Figure 6a</xref>, different learning rates significantly affect the agents&#x2019; performance during Multi-Agent Reinforcement Learning (MARL) training. With an increasing number of training epochs, all curves exhibit a clear downward trend, indicating that the agents are gradually learning more optimal evacuation strategies. Specifically, the curve for a learning rate of 0.1 (blue) shows a rapid initial decline and achieves a lower step count within fewer training epochs, suggesting that a higher learning rate can accelerate model convergence. However, as training progresses, the curve for a learning rate of 0.1 displays greater volatility, indicating that a high learning rate may lead to model instability. In contrast, the curves for learning rates of 0.01 (green) and 0.001 (red) are more stable in the later stages of training. Despite their slower convergence, they ultimately achieve better convergence results.</p>
<p>
<xref ref-type="fig" rid="F6">Figure 6b</xref> shows the impact of different discount factors on the agents&#x2019; training performance. The curve for a discount factor of 1 (blue) exhibits a rapid initial decline, reaching a lower step count within fewer training epochs, indicating that considering long-term rewards enables agents to quickly find optimal evacuation strategies. However, as training progresses, the curve for a discount factor of 1 shows significant fluctuations, suggesting that considering a too long-term reward period may lead to model instability in practical applications. In contrast, the curves for discount factors of 0.999 (green) and 0.99 (red) show a more stable downward trend throughout training, ultimately achieving lower and more stable step counts. The curve for a discount factor of 0.999 balances convergence speed and stability, demonstrating a better overall performance. This indicates that an appropriate discount factor can balance short-term and long-term rewards, enhancing the model&#x2019;s overall performance.</p>
</sec>
<sec id="s4-4-2">
<title>4.4.2 Ablation experiment results</title>
<p>In this study, we conducted ablation experiments on three datasets&#x2014;Sentinel-1 SAR Imagery, Global Fire Emissions Database (GFED), and NASA LP DAAC Vegetation Index&#x2014;to evaluate the impact of different modules on the overall performance of the GreyGNN-MARL model. By comparing the performance of the full model with versions where specific modules were removed, we can clearly see each module&#x2019;s contribution to overall performance.</p>
<p>As shown in <xref ref-type="table" rid="T3">Table 3</xref>, removing the GNN module significantly increases evacuation time and reduces the avoidance success rate, indicating the critical role of GNNs in extracting geographic structure information and optimizing the path. Similarly, removing the GWO module results in notable decreases in path safety and path smoothness, demonstrating the importance of the GWO module in optimizing path weights and parameters. When the MARL module is removed, communication delay increases, though other metrics are less affected, highlighting the MARL module&#x2019;s role in enhancing model collaboration and optimizing evacuation strategies. The full model performs best across all metrics, validating the effectiveness of the cooperative work of all modules.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Ablation study results for the Sentinel-1 SAR Imagery dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">Evacuation time</th>
<th align="center">Avoidance success rate</th>
<th align="center">Path safety</th>
<th align="center">Path smoothness</th>
<th align="center">Communication delay</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">No GNNs</td>
<td align="center">24.67</td>
<td align="center">72.15%</td>
<td align="center">7.32</td>
<td align="center">14.52</td>
<td align="center">18.35</td>
</tr>
<tr>
<td align="center">No GWO</td>
<td align="center">39.52</td>
<td align="center">60.78%</td>
<td align="center">9.25</td>
<td align="center">15.34</td>
<td align="center">19.46</td>
</tr>
<tr>
<td align="center">No MARL</td>
<td align="center">27.91</td>
<td align="center">68.23%</td>
<td align="center">6.15</td>
<td align="center">13.78</td>
<td align="center">20.78</td>
</tr>
<tr>
<td align="center">Full Model</td>
<td align="center">19.35</td>
<td align="center">85.45%</td>
<td align="center">4.15</td>
<td align="center">10.25</td>
<td align="center">13.45</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>As shown in <xref ref-type="table" rid="T4">Table 4</xref>, removing the GNN module leads to a significant increase in evacuation time and a lower avoidance success rate, emphasizing the importance of GNNs in extracting dynamic fire information and optimizing the path. Removing the GWO module decreases path safety and path smoothness, highlighting the critical role of GWO in path weight and parameter optimization. Removing the MARL module increases communication delay, though other metrics are minimally affected, underscoring the importance of MARL in model collaboration and evacuation strategy optimization. The full model performs best across all metrics, affirming the benefits of all modules working in unison.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Ablation study results for the GFED dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">Evacuation time</th>
<th align="center">Avoidance success rate</th>
<th align="center">Path safety</th>
<th align="center">Path smoothness</th>
<th align="center">Communication delay</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">No GNNs</td>
<td align="center">28.54</td>
<td align="center">66.45%</td>
<td align="center">9.05</td>
<td align="center">16.72</td>
<td align="center">30.78</td>
</tr>
<tr>
<td align="center">No GWO</td>
<td align="center">27.85</td>
<td align="center">58.32%</td>
<td align="center">5.28</td>
<td align="center">17.18</td>
<td align="center">25.45</td>
</tr>
<tr>
<td align="center">No MARL</td>
<td align="center">29.93</td>
<td align="center">63.54%</td>
<td align="center">6.52</td>
<td align="center">15.12</td>
<td align="center">18.12</td>
</tr>
<tr>
<td align="center">Full Model</td>
<td align="center">21.25</td>
<td align="center">82.48%</td>
<td align="center">4.23</td>
<td align="center">11.35</td>
<td align="center">14.56</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>As shown in <xref ref-type="table" rid="T5">Table 5</xref>, removing the GNN module significantly increases evacuation time and reduces the avoidance success rate, highlighting the role of GNNs in constructing the fire scene network structure and optimizing the path. Removing the GWO module decreases path safety and path smoothness, illustrating the GWO module&#x2019;s critical role in optimizing path weights and parameters. Removing the MARL module increases communication delay, though other metrics are minimally affected, showing MARL&#x2019;s importance in enhancing model collaboration and optimizing evacuation strategies. The full model performs best across all metrics, validating the effectiveness of the cooperative work of all modules.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Ablation study results for the NASA LP DAAC Vegetation index dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">Evacuation time</th>
<th align="center">Avoidance success rate</th>
<th align="center">Path safety</th>
<th align="center">Path smoothness</th>
<th align="center">Communication delay</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">No GNNs</td>
<td align="center">30.12</td>
<td align="center">69.78%</td>
<td align="center">7.25</td>
<td align="center">15.84</td>
<td align="center">14.92</td>
</tr>
<tr>
<td align="center">No GWO</td>
<td align="center">42.19</td>
<td align="center">62.14%</td>
<td align="center">7.78</td>
<td align="center">18.12</td>
<td align="center">23.12</td>
</tr>
<tr>
<td align="center">No MARL</td>
<td align="center">34.76</td>
<td align="center">65.32%</td>
<td align="center">7.02</td>
<td align="center">16.47</td>
<td align="center">22.78</td>
</tr>
<tr>
<td align="center">Full Model</td>
<td align="center">20.72</td>
<td align="center">84.62%</td>
<td align="center">3.95</td>
<td align="center">12.54</td>
<td align="center">12.35</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Through analysis of the ablation experiment results across the three datasets, the vital roles of the GNN, GWO, and MARL modules in the GreyGNN-MARL model are evident. Each module enhances the model&#x2019;s performance in different aspects, confirming the rationality and effectiveness of the model design. These results provide important references for further optimization and improvement of the model.</p>
<p>According to the experimental results in <xref ref-type="table" rid="T6">Table 6</xref>, the model shows similar computational complexity and running efficiency on different datasets.</p>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>Training results of the GreyGNN-MARL model on the Sentinel-1 SAR image dataset, GFED dataset, and NASA LP DAAC vegetation index dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Dataset</th>
<th align="center">Parameters (M)</th>
<th align="center">Flops (G)</th>
<th align="center">Inference time (ms)</th>
<th align="center">Training time (s)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Sentinel-1 SAR Imagery</td>
<td align="center">15.2</td>
<td align="center">4.7</td>
<td align="center">120</td>
<td align="center">300</td>
</tr>
<tr>
<td align="center">GFED Dataset</td>
<td align="center">14.8</td>
<td align="center">4.5</td>
<td align="center">115</td>
<td align="center">290</td>
</tr>
<tr>
<td align="center">NASA LP DAAC Vegetation Index</td>
<td align="center">15.5</td>
<td align="center">4.8</td>
<td align="center">125</td>
<td align="center">310</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>On all datasets, the number of parameters of the model is between 15.2&#xa0;M and 15.5&#xa0;M, and the floating point operation volume is roughly between 4.5&#xa0;G and 4.8&#xa0;G, indicating that the computational requirements of the model on these three datasets are relatively consistent. The inference time is between 120&#xa0;ms and 125&#xa0;ms, showing that the model has good real-time response capabilities and can quickly optimize the evacuation path. The training time is slightly different on different datasets. The training time for the Sentinel-1 SAR image dataset is 300&#xa0;s, the GFED dataset is 290&#xa0;s, and the NASA LP DAAC vegetation index dataset is 310&#xa0;s. These results show that despite the different datasets, the model can still maintain a relatively stable computational efficiency during training. Overall, the GreyGNN-MARL model performs well in computational efficiency and performance, and can efficiently perform path optimization tasks in a variety of datasets and fire scenarios, proving its wide applicability and practicality. These experimental results also verify that the model has strong real-time response capabilities in practical applications, can quickly provide optimized evacuation paths in the response phase, and can process data of different complexities in the training phase.</p>
</sec>
<sec id="s4-4-3">
<title>4.4.3 Comparative experiment results</title>
<p>In the comparative experiments, we evaluated the performance of the GreyGNN-MARL model in fire evacuation path optimization against results from other traditional path planning algorithms and single-agent reinforcement learning algorithms. <xref ref-type="table" rid="T7">Tables 7</xref>&#x2013;<xref ref-type="table" rid="T9">9</xref> present the experimental results on the Sentinel-1 SAR Imagery, Global Fire Emissions Database (GFED), and NASA LP DAAC Vegetation Index datasets, respectively.</p>
<table-wrap id="T7" position="float">
<label>TABLE 7</label>
<caption>
<p>Comparison of different models on the Sentinel-1 SAR Imagery dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">Evacuation time</th>
<th align="center">Avoidance success rate</th>
<th align="center">Path safety</th>
<th align="center">Path smoothness</th>
<th align="center">Communication delay</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">A&#x2a; Algorithm (<xref ref-type="bibr" rid="B49">Zhu et al., 2024</xref>)</td>
<td align="center">28.45</td>
<td align="center">68.32%</td>
<td align="center">5.98</td>
<td align="center">16.32</td>
<td align="center">13.55</td>
</tr>
<tr>
<td align="center">Dijkstra Algorithm (<xref ref-type="bibr" rid="B23">Mirahadi and McCabe, 2021</xref>)</td>
<td align="center">30.76</td>
<td align="center">64.58%</td>
<td align="center">6.32</td>
<td align="center">17.84</td>
<td align="center">12.84</td>
</tr>
<tr>
<td align="center">Bellman-Ford Algorithm (<xref ref-type="bibr" rid="B4">Bhat et al., 2024</xref>)</td>
<td align="center">32.14</td>
<td align="center">66.74%</td>
<td align="center">5.87</td>
<td align="center">18.02</td>
<td align="center">14.67</td>
</tr>
<tr>
<td align="center">Floyd-Warshall Algorithm (<xref ref-type="bibr" rid="B11">G&#xf3;mez et al., 2023</xref>)</td>
<td align="center">29.86</td>
<td align="center">65.12%</td>
<td align="center">6.13</td>
<td align="center">17.34</td>
<td align="center">13.23</td>
</tr>
<tr>
<td align="center">Single-agent RL (<xref ref-type="bibr" rid="B44">Young and Aguirre, 2021</xref>)</td>
<td align="center">27.58</td>
<td align="center">69.45%</td>
<td align="center">5.74</td>
<td align="center">16.08</td>
<td align="center">14.08</td>
</tr>
<tr>
<td align="center">GreyGNN-MARL (Full Model)</td>
<td align="center">20.05</td>
<td align="center">85.45%</td>
<td align="center">3.94</td>
<td align="center">10.25</td>
<td align="center">11.43</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T8" position="float">
<label>TABLE 8</label>
<caption>
<p>Comparison of different models on the GFED dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">Evacuation time</th>
<th align="center">Avoidance success rate</th>
<th align="center">Path safety</th>
<th align="center">Path smoothness</th>
<th align="center">Communication delay</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">A&#x2a; Algorithm</td>
<td align="center">30.92</td>
<td align="center">63.41%</td>
<td align="center">6.22</td>
<td align="center">17.32</td>
<td align="center">14.32</td>
</tr>
<tr>
<td align="center">Dijkstra Algorithm</td>
<td align="center">32.87</td>
<td align="center">62.58%</td>
<td align="center">6.48</td>
<td align="center">18.68</td>
<td align="center">13.68</td>
</tr>
<tr>
<td align="center">Bellman-Ford Algorithm</td>
<td align="center">34.15</td>
<td align="center">61.94%</td>
<td align="center">6.05</td>
<td align="center">18.47</td>
<td align="center">15.47</td>
</tr>
<tr>
<td align="center">Floyd-Warshall Algorithm</td>
<td align="center">31.68</td>
<td align="center">64.82%</td>
<td align="center">6.27</td>
<td align="center">17.06</td>
<td align="center">14.06</td>
</tr>
<tr>
<td align="center">Single-agent RL</td>
<td align="center">29.75</td>
<td align="center">67.17%</td>
<td align="center">5.89</td>
<td align="center">16.22</td>
<td align="center">15.22</td>
</tr>
<tr>
<td align="center">GreyGNN-MARL (Full Model)</td>
<td align="center">18.99</td>
<td align="center">82.48%</td>
<td align="center">4.23</td>
<td align="center">11.35</td>
<td align="center">14.56</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T9" position="float">
<label>TABLE 9</label>
<caption>
<p>Comparison of different models on the NASA LP DAAC Vegetation Index dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">Evacuation time</th>
<th align="center">Avoidance success rate</th>
<th align="center">Path safety</th>
<th align="center">Path smoothness</th>
<th align="center">Communication delay</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">A&#x2a; Algorithm</td>
<td align="center">31.45</td>
<td align="center">66.34%</td>
<td align="center">6.34</td>
<td align="center">17.67</td>
<td align="center">13.67</td>
</tr>
<tr>
<td align="center">Dijkstra Algorithm</td>
<td align="center">33.87</td>
<td align="center">63.24%</td>
<td align="center">6.58</td>
<td align="center">18.98</td>
<td align="center">12.98</td>
</tr>
<tr>
<td align="center">Bellman-Ford Algorithm</td>
<td align="center">35.14</td>
<td align="center">62.48%</td>
<td align="center">6.21</td>
<td align="center">19.83</td>
<td align="center">14.83</td>
</tr>
<tr>
<td align="center">Floyd-Warshall Algorithm</td>
<td align="center">32.68</td>
<td align="center">65.17%</td>
<td align="center">6.41</td>
<td align="center">18.54</td>
<td align="center">13.54</td>
</tr>
<tr>
<td align="center">Single-agent RL</td>
<td align="center">30.75</td>
<td align="center">67.06%</td>
<td align="center">6.02</td>
<td align="center">16.29</td>
<td align="center">14.29</td>
</tr>
<tr>
<td align="center">GreyGNN-MARL (Full Model)</td>
<td align="center">18.18</td>
<td align="center">84.62%</td>
<td align="center">3.24</td>
<td align="center">12.54</td>
<td align="center">12.35</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>As shown in <xref ref-type="table" rid="T7">Table 7</xref>, the GreyGNN-MARL model demonstrates the best performance across all metrics. In terms of evacuation time, the GreyGNN-MARL model achieves an evacuation time of 20.05, significantly lower than the best-performing traditional algorithm (Single-agent RL), which has an evacuation time of 27.58. For avoidance success rate, the GreyGNN-MARL model achieves 85.45%, much higher than other models, showing its superior ability to navigate around high-risk areas. In terms of path safety, the GreyGNN-MARL model scores 3.94, significantly better than other models, indicating its advantage in selecting safer paths. Additionally, the GreyGNN-MARL model outperforms other models in path smoothness and communication delay, further validating its superior performance in complex fire environments.</p>
<p>According to the results in <xref ref-type="table" rid="T8">Table 8</xref>, the GreyGNN-MARL model also outperforms other models on the GFED dataset. Specifically, the GreyGNN-MARL model achieves an evacuation time of 18.99, significantly lower than the best-performing traditional algorithm (Single-agent RL), which has an evacuation time of 29.75. For avoidance success rate, the GreyGNN-MARL model achieves 82.48%, showing its strong capability to navigate efficiently in fire scenarios. In terms of path safety, the GreyGNN-MARL model scores 4.23, significantly safer than other models. Additionally, the GreyGNN-MARL model shows superior performance in path smoothness and communication delay, demonstrating its effectiveness in fire evacuation path optimization.</p>
<p>As shown in <xref ref-type="table" rid="T9">Table 9</xref>, the GreyGNN-MARL model significantly outperforms other models on the NASA LP DAAC Vegetation Index dataset. In terms of evacuation time, the GreyGNN-MARL model achieves an evacuation time of 18.18, significantly lower than the best-performing traditional algorithm (Single-agent RL), which has an evacuation time of 30.75. For avoidance success rate, the GreyGNN-MARL model achieves 84.62%, indicating its significant advantage in navigating high-risk areas. The GreyGNN-MARL model also demonstrates superior performance in path safety, path smoothness, and communication delay, further validating its advantages in complex fire environments.</p>
<p>The GreyGNN-MARL model consistently outperforms traditional path planning algorithms and single-agent reinforcement learning algorithms across various datasets, demonstrating its significant advantages in fire evacuation path optimization. These results validate the effectiveness and reliability of the GreyGNN-MARL model in practical applications.</p>
</sec>
<sec id="s4-4-4">
<title>4.4.4 Evacuation path results</title>
<p>
<xref ref-type="fig" rid="F7">Figure 7</xref> illustrates the fire localization and dynamic monitoring process in fire evacuation route planning. <xref ref-type="fig" rid="F7">Figure 7a</xref> shows the initial satellite image of the fire area, with the yellow contour representing the boundary of the study area. <xref ref-type="fig" rid="F7">Figure 7b</xref> further focuses on the area where the fire is most concentrated, marking the high-risk fire area with a black frame, showing the concentrated distribution of the fire and helping to identify the main direction of fire spread. <xref ref-type="fig" rid="F7">Figure 7c</xref> displays the evacuation distribution of agents during the fire simulation process, with orange and pink markers representing different evacuation agents, showing their concentrated avoidance and evacuation distribution in high-risk fire areas. Through this visualization result, it can be seen that the model effectively identifies and locates high-risk fire areas using multi-source data, and achieves avoidance and evacuation optimization in high-risk areas through dynamic path adjustments of agents. The fire spread and evacuation point distribution in the figure indicate that the model can adjust evacuation strategies in real-time according to fire changes in the fire environment, ensuring the safety and efficiency of evacuation routes.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Fire localization and agent distribution in fire monitoring and evacuation route planning. <bold>(a)</bold> Shows the initial fire satellite image of the study area, with the yellow contour as the boundary of the study area; <bold>(b)</bold> focuses on the fire-concentrated area, marking the high-risk fire area with a black frame; <bold>(c)</bold> shows the evacuation distribution of agents during the fire simulation process, with orange and pink markers indicating different agents.</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g007.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F8">Figure 8</xref> shows the fire spread dynamics and fire boundary identification process in the fire area. In <xref ref-type="fig" rid="F8">Figure 8a</xref>, a satellite image of the early stage of the fire is shown, and the purple area indicates the main burning range of the fire. Through <xref ref-type="fig" rid="F8">Figure 8b</xref>, combined with geographic information system (GIS) data, the high-risk area of the fire area is marked in red, and the yellow boundary line marks the outer edge of the fire, providing the geographical boundary of the fire spread. This image highlights the high-risk area of the fire and its outer boundary, which is convenient for further analysis of the trend of fire spread. <xref ref-type="fig" rid="F8">Figure 8c</xref> shows the boundary detection results of the fire area, where the yellow boundary line clearly outlines the expansion range of the fire, can track the dynamic changes of the fire in real time, and provides an important basis for subsequent evacuation route planning. Through these visualization results, we can clearly see the high-precision performance of the model in fire monitoring and boundary identification.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Visualization of fire spread dynamics and fire boundary identification in the fire area (Color Description: purple indicates the main burning area of the fire, red indicates the high-risk area, and yellow indicates the outer edge of the fire. Part <bold>(a)</bold> shows the initial fire spread, <bold>(b)</bold> shows the high-risk area, and <bold>(c)</bold> shows the outer boundary of the fire).</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g008.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F9">Figure 9</xref> shows the distribution of buildings in the fire scenario and the evacuation route planning recommended by the model. The large image on the left shows the dense distribution of buildings in the fire-affected area, with the black area representing high-risk buildings for fire. Through the red magnifying glass display, the right side of the figure further enlarges the layout details of the buildings in this area to more clearly show the structure of the high-risk fire area. The bottom figure shows the details of the evacuation routes planned by the model in the high-risk area, with paths avoiding dense buildings and fire hotspot areas to ensure safe evacuation. From <xref ref-type="fig" rid="F9">Figure 9</xref>, it can be seen that the model in this paper can carry out efficient path planning under complex building layouts. The model&#x2019;s path recommendations in high-risk fire areas take into account building density, fire risk levels, and path smoothness, generating evacuation routes that avoid fire hotspots and dense areas, providing relatively safe passages for evacuating personnel. This intelligent path planning has important practical value in fire environments, helping to reduce evacuation time and increase the success rate of risk avoidance. The result verifies the model&#x2019;s ability to plan effective evacuation routes in complex urban environments.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Building distribution in fire scenarios and details of evacuation route planning.</p>
</caption>
<graphic xlink:href="fenvs-13-1522933-g009.tif"/>
</fig>
</sec>
</sec>
</sec>
<sec sec-type="conclusion" id="s5">
<title>5 Conclusion</title>
<p>This paper proposes a grassland fire evacuation route optimization strategy based on the GreyGNN-MARL model to address the dynamic and complex evacuation needs in grassland fires. The model integrates the real-time monitoring capabilities of Synthetic Aperture Radar (SAR) imagery, the structured extraction of fire scene geographic information by Graph Neural Networks (GNNs), the dynamic adjustment of path weights by the Grey Wolf Optimization (GWO) algorithm, and the intelligent collaboration of Multi-Agent Reinforcement Learning (MARL) in high-risk environments, successfully achieving the intelligent planning and dynamic optimization of grassland fire evacuation routes. Experimental results show that the GreyGNN-MARL model significantly outperforms traditional evacuation route planning methods in terms of evacuation time, risk avoidance success rate, route safety, route smoothness, and communication delay, especially in dynamic fire scenarios, providing effective technical support for emergency management of grassland fires.</p>
<p>Although this study has achieved good experimental results, there are still some limitations. First, the applicability and performance of the model in larger-scale and more complex fire scenarios have not been fully verified. The current experiments are mainly based on simulated environments and limited data sets. Practical applications may face more complex terrain, climate change and sudden fire situations, which may affect the stability and response speed of the model. Secondly, the training and optimization process of the model is relatively complex, and the demand for computing resources is high, which may bring challenges in practical applications with limited resources, especially in the real-time evacuation decision-making process. How to ensure rapid response is still a problem that needs to be further solved. In addition, when dealing with various types of fires, cross-regional evacuations, etc., the model may require additional adaptation and optimization to ensure its wide application in various fire emergency scenarios.</p>
<p>In future research, we will further optimize the GreyGNN-MARL model to improve its applicability and computational efficiency in complex fire scenarios, and ensure that evacuation route planning can respond more quickly to dynamic changes at the fire scene. In order to enhance the practicality of the model, we plan to apply it to real fire data for verification, especially through cooperation with emergency management departments, using real-time data from actual grassland fires and other types of fires to verify the effectiveness of the model. In addition, we will introduce more actual fire data for verification to further explore the application potential of the model in emergency safety management, especially in fire spread prediction and risk avoidance decision-making. At the same time, we also plan to combine more advanced optimization algorithms and intelligent technologies to strive to further improve the performance and security of the model, provide more solid technical support for grassland fire emergency response, and contribute to future grassland ecological protection and security.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="s7">
<title>Author contributions</title>
<p>ZZ: Data curation, Investigation, Project administration, Visualization, Writing&#x2013;review and editing. LT: Data curation, Formal Analysis, Investigation, Resources, Writing&#x2013;original draft. RT: Methodology, Resources, Software, Validation, Writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s8">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Agarwal</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Tapaswi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chanak</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Intelligent emergency evacuation system for industrial environments using iot-enabled wsns</article-title>. <source>IEEE Trans. Instrum. Meas.</source> <volume>72</volume>, <fpage>1</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1109/tim.2023.3328071</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alsamhi</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Almalki</surname>
<given-names>F. A.</given-names>
</name>
<name>
<surname>Al-Dois</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Shvetsov</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Ansari</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Hawbani</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Multi-drone edge intelligence and sar smart wearable devices for emergency communication</article-title>. <source>Wirel. Commun. Mob. Comput.</source> <volume>2021</volume>, <fpage>6710074</fpage>. <pub-id pub-id-type="doi">10.1155/2021/6710074</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ban</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Nascetti</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bevington</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Wulder</surname>
<given-names>M. A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Near real-time wildfire progression monitoring with sentinel-1 sar time series and deep learning</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>1322</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-56967-x</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhat</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Rao</surname>
<given-names>P. K.</given-names>
</name>
<name>
<surname>Kamath</surname>
<given-names>C. R.</given-names>
</name>
<name>
<surname>Tandon</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Vizzapu</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Comparative analysis of bellman-ford and dijkstra&#x2019;s algorithms for optimal evacuation route planning in multi-floor buildings</article-title>. <source>Cogent Eng.</source> <volume>11</volume>, <fpage>2319394</fpage>. <pub-id pub-id-type="doi">10.1080/23311916.2024.2319394</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bouguettaya</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zarzour</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Taberkit</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Kechida</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A review on early wildfire detection from unmanned aerial vehicles using deep learning-based computer vision algorithms</article-title>. <source>Signal Process.</source> <volume>190</volume>, <fpage>108309</fpage>. <pub-id pub-id-type="doi">10.1016/j.sigpro.2021.108309</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chae</surname>
<given-names>Y. H.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Seong</surname>
<given-names>P. H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Graph neural network based multiple accident diagnosis in nuclear power plants: data optimization to represent the system configuration</article-title>. <source>Nucl. Eng. Technol.</source> <volume>54</volume>, <fpage>2859</fpage>&#x2013;<lpage>2870</lpage>. <pub-id pub-id-type="doi">10.1016/j.net.2022.02.024</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Application of the best evacuation model of deep learning in the design of public structures</article-title>. <source>Image Vis. Comput.</source> <volume>102</volume>, <fpage>103975</fpage>. <pub-id pub-id-type="doi">10.1016/j.imavis.2020.103975</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Florath</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Keller</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Supervised machine learning approaches on multispectral remote sensing data for a combined detection of fire and burned area</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <fpage>657</fpage>. <pub-id pub-id-type="doi">10.3390/rs14030657</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ge</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Spatio-temporal knowledge graph based forest fire prediction with multi source heterogeneous data</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <fpage>3496</fpage>. <pub-id pub-id-type="doi">10.3390/rs14143496</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ghali</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Akhloufi</surname>
<given-names>M. A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Deep learning approaches for wildland fires using satellite remote sensing data: detection, mapping, and prediction</article-title>. <source>Fire</source> <volume>6</volume>, <fpage>192</fpage>. <pub-id pub-id-type="doi">10.3390/fire6050192</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>G&#xf3;mez</surname>
<given-names>R. U. &#xc1;.</given-names>
</name>
<name>
<surname>P&#xe9;rez Olgu&#xed;n</surname>
<given-names>I. J. C.</given-names>
</name>
<name>
<surname>P&#xe9;rez Dom&#xed;nguez</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-Pic&#xf3;n</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>M&#xe9;ndez-Gonz&#xe1;lez</surname>
<given-names>L. C.</given-names>
</name>
</person-group> (<year>2023</year>). &#x201c;<article-title>Distribution route optimization using floyd-warshall weighted graph analysis algorithm with google maps integration in industry 4.0 context</article-title>,&#x201d; in <source>Innovation and competitiveness in industry 4.0 based on intelligent systems</source> (<publisher-name>Springer</publisher-name>), <fpage>287</fpage>&#x2013;<lpage>305</lpage>.</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gupta</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Watson</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Deep learning-based aerial image segmentation with open data for disaster impact assessment</article-title>. <source>Neurocomputing</source> <volume>439</volume>, <fpage>22</fpage>&#x2013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2020.02.139</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ban</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Nascetti</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Uni-temporal multispectral imagery for burned area mapping with deep learning</article-title>. <source>Remote Sens.</source> <volume>13</volume>, <fpage>1509</fpage>. <pub-id pub-id-type="doi">10.3390/rs13081509</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ban</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Rahnemoonfar</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2023a</year>). <article-title>Gan-based sar and optical image translation for wildfire impact assessment using multi-source remote sensing data</article-title>. <source>Remote Sens. Environ.</source> <volume>289</volume>, <fpage>113522</fpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2023.113522</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zuo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Iannucci</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Joe-Wong</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2023b</year>). &#x201c;<article-title>Intelligent communication planning for constrained environmental iot sensing with reinforcement learning</article-title>,&#x201d; in <conf-name>2023 20th Annual IEEE International Conference on Sensing, Communication, and Networking (SECON)</conf-name> (<publisher-name>IEEE</publisher-name>), <fpage>357</fpage>&#x2013;<lpage>365</lpage>.</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>An</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Ning</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tiwari</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Uniformity and deformation: a benchmark for multi-fish real-time tracking in the farming</article-title>. <source>Expert Syst. Appl.</source> <volume>264</volume>, <fpage>125653</fpage>. <pub-id pub-id-type="doi">10.1016/j.eswa.2024.125653</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huot</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Goyal</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Sankar</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ihme</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y. F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Next day wildfire spread: a machine learning dataset to predict wildfire spreading from remote-sensing data</article-title>. <source>IEEE Trans. Geoscience Remote Sens.</source> <volume>60</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1109/tgrs.2022.3192974</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ziegler</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Rapid and large-scale mapping of flood inundation via integrating spaceborne synthetic aperture radar imagery with unsupervised deep learning</article-title>. <source>ISPRS J. photogrammetry remote Sens.</source> <volume>178</volume>, <fpage>36</fpage>&#x2013;<lpage>50</lpage>. <pub-id pub-id-type="doi">10.1016/j.isprsjprs.2021.05.019</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Karimzadeh</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ghasemi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Matsuoka</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yagi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zulfikar</surname>
<given-names>A. C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A deep learning model for road damage detection after an earthquake based on synthetic aperture radar (sar) and field datasets</article-title>. <source>IEEE J. Sel. Top. Appl. Earth Observations Remote Sens.</source> <volume>15</volume>, <fpage>5753</fpage>&#x2013;<lpage>5765</lpage>. <pub-id pub-id-type="doi">10.1109/jstars.2022.3189875</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kodipalli</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fernandes</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Dasar</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Ismail</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Computational framework of inverted fuzzy c-means and quantum convolutional neural network towards accurate detection of ovarian tumors</article-title>. <source>Int. J. E-Health Med. Commun. (IJEHMC)</source> <volume>14</volume>, <fpage>1</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.4018/ijehmc.321149</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lasaponara</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Fattore</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Modica</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Imaging burned areas and fire severity in mediterranean fragmented ecosystems using sentinel-1 and sentinel-2: the case study of tortoli&#x2013;ogliastra fire (sardinia)</article-title>. <source>IEEE Geoscience Remote Sens. Lett.</source> <volume>20</volume>, <fpage>1</fpage>&#x2013;<lpage>5</lpage>. <pub-id pub-id-type="doi">10.1109/lgrs.2023.3324945</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>I. K.</given-names>
</name>
<name>
<surname>Trinder</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Sowmya</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Application of u-net convolutional neural network to bushfire monitoring in Australia with sentinel-1/-2 data</article-title>. <source>Int. Archives Photogrammetry, Remote Sens. Spatial Inf. Sci.</source> <volume>43</volume>, <fpage>573</fpage>&#x2013;<lpage>578</lpage>. <pub-id pub-id-type="doi">10.5194/isprs-archives-xliii-b1-2020-573-2020</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mirahadi</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>McCabe</surname>
<given-names>B. Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Evacusafe: a real-time model for building evacuation based on dijkstra&#x2019;s algorithm</article-title>. <source>J. Build. Eng.</source> <volume>34</volume>, <fpage>101687</fpage>. <pub-id pub-id-type="doi">10.1016/j.jobe.2020.101687</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nur</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>Y. J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>C. W.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Creation of wildfire susceptibility maps in plumas national forest using insar coherence, deep learning, and metaheuristic optimization approaches</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <fpage>4416</fpage>. <pub-id pub-id-type="doi">10.3390/rs14174416</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Oliva</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Medina</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Dur&#xe1;n</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Vidal</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2020</year>). &#x201c;<article-title>Improved biomass and burning efficiency factors for forest fire emissions estimation in central Chile</article-title>,&#x201d; in <conf-name>2020 IEEE Latin American GRSS and ISPRS Remote Sensing Conference (LAGIRS)</conf-name>, <conf-loc>Santiago, Chile</conf-loc>, <conf-date>22&#x2013;26 March, 2020</conf-date> (<publisher-name>IEEE</publisher-name>), <fpage>477</fpage>&#x2013;<lpage>482</lpage>.</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Nath</surname>
<given-names>N. D.</given-names>
</name>
<name>
<surname>Behzadan</surname>
<given-names>A. H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Convolutional neural networks for object detection in aerial imagery for disaster response and recovery</article-title>. <source>Adv. Eng. Inf.</source> <volume>43</volume>, <fpage>101009</fpage>. <pub-id pub-id-type="doi">10.1016/j.aei.2019.101009</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Poudel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Moh</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Hybrid path planning for efficient data collection in uav-aided wsns for emergency applications</article-title>. <source>Sensors</source> <volume>21</volume>, <fpage>2839</fpage>. <pub-id pub-id-type="doi">10.3390/s21082839</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salami</surname>
<given-names>O. B.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Pushparaj</surname>
<given-names>R. I.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Underground mining fire hazards and the optimization of emergency evacuation strategies (ees): the issues, existing methodology and limitations, and way forward</article-title>. <source>Process Saf. Environ. Prot.</source> <volume>177</volume>, <fpage>617</fpage>&#x2013;<lpage>634</lpage>. <pub-id pub-id-type="doi">10.1016/j.psep.2023.07.012</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sannidhan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Martis</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Nayak</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Aithal</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Sudeepa</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Detection of antibiotic constituent in aspergillus flavus using quantum convolutional neural network</article-title>. <source>Int. J. E-Health Med. Commun. (IJEHMC)</source> <volume>14</volume>, <fpage>1</fpage>&#x2013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.4018/ijehmc.321150</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharma</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Andersen</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Granmo</surname>
<given-names>O. C.</given-names>
</name>
<name>
<surname>Goodwin</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Deep q-learning with q-matrix transfer learning for novel fire evacuation environment</article-title>. <source>IEEE Trans. Syst. Man, Cybern. Syst.</source> <volume>51</volume>, <fpage>7363</fpage>&#x2013;<lpage>7381</lpage>. <pub-id pub-id-type="doi">10.1109/tsmc.2020.2967936</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Subramanian</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Rajesh</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Britto</surname>
<given-names>P. I.</given-names>
</name>
<name>
<surname>Sankaran</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Mdho: mayfly deer hunting optimization algorithm for optimal obstacle avoidance based path planning using mobile robots</article-title>. <source>Cybern. Syst.</source>, <fpage>1</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1080/01969722.2023.2177804</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hua</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mou</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>X. X.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Cg-net: conditional gis-aware network for individual building segmentation in vhr sar images</article-title>. <source>IEEE Trans. Geoscience Remote Sens.</source> <volume>60</volume>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1109/tgrs.2020.3043089</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lv</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2024</year>). &#x201c;<article-title>Multi-uav trajectory planning based on improved multi-population grey wolf optimizer algorithm</article-title>,&#x201d; in <conf-name>2024 36th Chinese control and decision conference (CCDC)</conf-name> (<publisher-name>IEEE</publisher-name>), <fpage>6142</fpage>&#x2013;<lpage>6148</lpage>.</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tian</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Forest fire spread monitoring and vegetation dynamics detection based on multi-source remote sensing images</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <fpage>4431</fpage>. <pub-id pub-id-type="doi">10.3390/rs14184431</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tlijani</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jouila</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nouri</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Optimized sliding mode control based on cuckoo search algorithm: application for 2df robot manipulator</article-title>. <source>Cybern. Syst.</source>, <fpage>1</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1080/01969722.2023.2247259</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>&#xdc;nal</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Gezer</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Pak</surname>
<given-names>B. K.</given-names>
</name>
<name>
<surname>G&#xfc;ng&#xf6;r</surname>
<given-names>V. &#xc7;.</given-names>
</name>
</person-group> (<year>2022</year>). &#x201c;<article-title>Generating emergency evacuation route directions based on crowd simulations with reinforcement learning</article-title>,&#x201d; in <conf-name>2022 Innovations in Intelligent Systems and Applications Conference (ASYU)</conf-name>, <conf-loc>Antalya, Turkey</conf-loc>, <conf-date>07&#x2013;09 September, 2022</conf-date> (<publisher-name>IEEE</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>6</lpage>.</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2025b</year>). <article-title>A unified framework for adversarial patch attacks against visual 3d object detection in autonomous driving</article-title>. <source>IEEE Trans. Circuits Syst. Video Technol.</source>, <fpage>1</fpage>. <pub-id pub-id-type="doi">10.1109/tcsvt.2025.3525725</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Lv</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2025a</year>). <article-title>Physically realizable adversarial creating attack against vision-based bev space 3d object detection</article-title>. <source>IEEE Trans. Image Process.</source> <volume>34</volume>, <fpage>538</fpage>&#x2013;<lpage>551</lpage>. <pub-id pub-id-type="doi">10.1109/tip.2025.3526056</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>New productive forces: indicator construction and spatio-temporal evolution</article-title>. <source>J. Xi&#x2019;an Univ. Finance Econ.</source> <volume>37</volume>, <fpage>31</fpage>&#x2013;<lpage>47</lpage>.</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Luan</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Quan</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Joint flying relay location and routing optimization for 6g uav&#x2013;iot networks: a graph neural network-based approach</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <fpage>4377</fpage>. <pub-id pub-id-type="doi">10.3390/rs14174377</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Research on evacuation path planning based on improved sparrow search algorithm</article-title>. <source>CMES-Computer Model. Eng. and Sci.</source> <volume>139</volume>, <fpage>1295</fpage>&#x2013;<lpage>1316</lpage>. <pub-id pub-id-type="doi">10.32604/cmes.2023.045096</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y. F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Intelligent planning of fire evacuation routes using an improved ant colony optimization algorithm</article-title>. <source>J. Build. Eng.</source> <volume>61</volume>, <fpage>105208</fpage>. <pub-id pub-id-type="doi">10.1016/j.jobe.2022.105208</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Passenger evacuation path planning in subway station under multiple fires based on multiobjective robust optimization</article-title>. <source>IEEE Trans. Intelligent Transp. Syst.</source> <volume>23</volume>, <fpage>21915</fpage>&#x2013;<lpage>21931</lpage>. <pub-id pub-id-type="doi">10.1109/tits.2022.3190291</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Young</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Aguirre</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Prioritevac: an agent-based model (abm) for examining social factors of building fire evacuation</article-title>. <source>Inf. Syst. Front.</source> <volume>23</volume>, <fpage>1083</fpage>&#x2013;<lpage>1096</lpage>. <pub-id pub-id-type="doi">10.1007/s10796-020-10074-9</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhenhua</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>New development concept to accelerate the formation of new productive forces: theoretical logic and implementation path</article-title>. <source>J. Xi&#x2019;an Univ. Finance Econ.</source> <volume>37</volume>, <fpage>3</fpage>&#x2013;<lpage>14</lpage>.</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Hdrlm3d: a deep reinforcement learning-based model with human-like perceptron and policy for crowd evacuation in 3d environments</article-title>. <source>ISPRS Int. J. Geo-Information</source> <volume>11</volume>, <fpage>255</fpage>. <pub-id pub-id-type="doi">10.3390/ijgi11040255</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>An</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Ning</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Self-supervised learning-based multi-source spectral fusion for fruit quality evaluation: a case study in mango fruit ripeness prediction</article-title>. <source>Inf. Fusion</source> <volume>117</volume>, <fpage>102814</fpage>. <pub-id pub-id-type="doi">10.1016/j.inffus.2024.102814</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ban</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Nascetti</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Learning u-net without forgetting for near real-time wildfire monitoring by the fusion of sar and optical time series</article-title>. <source>Remote Sens. Environ.</source> <volume>261</volume>, <fpage>112467</fpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2021.112467</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Research on escape route planning analysis in forest fire scenes based on the improved a&#x2a; algorithm</article-title>. <source>Ecol. Indic.</source> <volume>166</volume>, <fpage>112355</fpage>. <pub-id pub-id-type="doi">10.1016/j.ecolind.2024.112355</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>