<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Public Health</journal-id>
<journal-title-group>
<journal-title>Frontiers in Public Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Public Health</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-2565</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpubh.2025.1644499</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Online bipartite matching methodology for anti-epidemic resources allocation: an adaptive time window based on reinforcement learning</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Wu</surname> <given-names>Zhiyong</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<uri xlink:href="https://loop.frontiersin.org/people/3095902"/>
</contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes">
<name><surname>Pang</surname> <given-names>Sulin</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<uri xlink:href="https://loop.frontiersin.org/people/1985125"/>
</contrib>
<contrib contrib-type="author">
<name><surname>He</surname> <given-names>Suyan</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<uri xlink:href="https://loop.frontiersin.org/people/3319237"/>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>School of Digital Economics and Trade, Guangzhou Huashang College</institution>, <city>Guangzhou</city>, <country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Institute of Finance Engineering/School of Emergency Management, Jinan University</institution>, <city>Guangzhou</city>, <country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>Department of Economics, Guangdong Institute of Public Administration</institution>, <city>Guangzhou</city>, <country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>&#x0002A;</label>Correspondence: Sulin Pang, <email xlink:href="mailto:pangsulin@jnu.edu.cn">pangsulin@jnu.edu.cn</email></corresp>
<fn fn-type="equal" id="fn001"><label>&#x02020;</label><p>These authors have contributed equally to this work and share first authorship</p></fn></author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-01-08">
<day>08</day>
<month>01</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1644499</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>06</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>30</day>
<month>09</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>02</day>
<month>12</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2026 Wu, Pang and He.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Wu, Pang and He</copyright-holder>
<license>
<ali:license_ref start_date="2026-01-08">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>This study aimed to investigate the online matching problem for anti-epidemic resources among multiple suppliers and recipients in the Internet of Healthcare System during a major outbreak. It accounts for the heterogeneity of supply and demand.</p></sec>
<sec>
<title>Methods</title>
<p>A multi-stage online dynamic bipartite matching model based on time windows is developed, which can be reformulated as a Markov decision process. An adaptive time window batch bipartite matching algorithm based on reinforcement learning is proposed, which utilizes the nearest neighbor&#x00027;s first heuristic strategy to allocate anti-epidemic resources.</p></sec>
<sec>
<title>Results</title>
<p>The optimal window size in <italic>fixed time window batch matching strategy</italic> (FTWBM) outperforms the results of <italic>adaptive time window batch matching strategy</italic> (ATWBM). However, the ATWBM strategy demonstrates greater effectiveness in adapting to the dynamic changes in epidemic prevention and control, particularly in partially optimistic scenarios.</p></sec>
<sec>
<title>Conclusions</title>
<p>The results revealed that, although the average matching rate consistently increases, the average waiting time initially decreases before rising again as the matching time window expands. This finding implies that health operations managers should modify the matching time window in response to changing epidemic dynamics and resource availability.</p></sec></abstract>
<kwd-group>
<kwd>major epidemics</kwd>
<kwd>bipartite matching</kwd>
<kwd>adaptive time window</kwd>
<kwd>resource allocation</kwd>
<kwd>reinforcement learning</kwd>
</kwd-group>
<funding-group>
 <funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was supported by the Key Discipline Construction Project (Key Discipline &#x02013; International Business) of Guangzhou Huashang College (910108772), the National Natural Science Foundation of China (72374085), the Major Science and Technology Project of Guangzhou&#x00027;s R &#x00026; D Plan in Key Areas (20220602JBGS04), and the Guangzhou Philosophy and Social Science Planning Project under Grant 2025GZGJ366.</funding-statement>
</funding-group>
<counts>
<fig-count count="4"/>
<table-count count="3"/>
<equation-count count="15"/>
<ref-count count="29"/>
<page-count count="12"/>
<word-count count="8979"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Disaster and Emergency Medicine</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Major epidemics have consistently posed significant threats to human health and presented challenges to public health systems. They serve as a substantial test of governance structures and capacities (<xref ref-type="bibr" rid="B1">1</xref>). China is actively promoting the integration of information technologies with medical and healthcare services. This initiative has sparked a new wave of technological and management innovations, interconnected through the Internet of Healthcare Systems (HIS) and characterized by intelligent medical and healthcare management. Internet of Things (IoT) technology is utilized to monitor the utilization of medical resources, and corresponding resource allocation plans to meet demand are proposed (<xref ref-type="bibr" rid="B2">2</xref>). These sharing platforms have played a crucial role in helping individuals understand the dynamics of the epidemic and alleviate anxiety, as evidenced by their significant contributions to enhancing social emergency management capabilities during the pandemic.</p>
<p>Simultaneously, major epidemics create a severe and complex situation characterized by rapid and widespread transmission, which can lead to insufficient preventive measures and resource constraints. This has heightened the challenges associated with epidemic prevention and swift response. Consequently, the rapid advancements in smart medical technology and healthcare, the implementation of IoT technology, and the emergence of sharing platforms to facilitate the effective allocation of preventive resources have become critical demands in public health.</p>
<p>This study examines the online matching problem for anti-epidemic resources among multiple suppliers and recipients from the onset to the conclusion of major epidemic emergencies. The supply of anti-epidemic resources remains relatively stable over a short time frame and does not exceed the existing delivery capacity. However, it is constrained by the geographical scope of service. Typically, during an epidemic, the demand for anti-epidemic resources experiences a sudden surge, whereas the quantity supplied often falls short of the quantity demanded. Furthermore, suppliers and recipients exhibit heterogeneity. This study addresses three key questions: (1) Which strategy should be employed for matching anti-epidemic resources: instant matching or delayed batch matching? (2) If the delayed batch matching strategy is adopted, should the fixed time window matching strategy or the adaptive time window matching strategy be selected? (3) If the delayed batch matching strategy is implemented, what is the impact of the size of the matching time window on the outcomes of the matching decision?</p>
<p>In this study, we applied the matching model to address the allocation of anti-epidemic resources and propose a multi-stage online dynamic bipartite matching model (MSODBM). We transformed the problem into a Markov decision process and designed a reinforcement learning-based adaptive time window batch bipartite matching algorithm that employs the nearest neighbor first (NNF) heuristic strategy. The principal contributions can be summarized as follows: First, a multi-stage dynamic bipartite matching model for anti-epidemic resources is proposed to address online allocation problems with resource constraints. This model effectively integrates the sharing organization framework with the challenge of allocating anti-epidemic resources, representing a novel application of intelligent technology in this field. The traditional allocation of anti-epidemic resources mostly focuses on optimizing allocation at the group level through offline methods. Due to information asymmetry, it is difficult to achieve an efficient allocation of anti-epidemic resources at the individual level. The online approach based on sharing platforms provides new possibilities for resource allocation at the individual level. Second, an adaptive time window batch bipartite matching approach is proposed. Drawing on the exploration-exploitation trade-off concept from reinforcement learning, we use the minimum average waiting time as the learning reward and employ a heuristic strategy that prioritizes the nearest neighbor. Given unpredictable epidemic developments and dynamic fluctuations in supply and demand, there is no universally optimal or static matching time window. Maintaining a relatively high level of exploration for the matching time window plays a significant role in the effective allocation of resources. Third, a Hungarian-based many-to-many matching algorithm with capacity constraints is developed. The classic Hungarian algorithm primarily addresses the assignment of a single task or resource without accounting for the matching capacity or the many-to-many matching problem. Given the mismatch between the supply and demand of anti-epidemic resources, which constitutes a many-to-many matching challenge, it is essential to extend the classic Hungarian algorithm. This extension is achieved by incorporating a capacity attribute and refining the augmented-path search mechanism.</p>
<p>The remainder of this study is organized as follows. In Section 2, we review related work. Section 3 formally defines the problem. In Section 4, a multi-to-multi bipartite matching heuristic strategy and an algorithm based on a self-adaptive time window are proposed. Extensive experiments conducted on synthetic data are presented in Section 5. Finally, Section 6 provides managerial insights and outlines potential directions for future research.</p></sec>
<sec id="s2">
<title>Related literature</title>
<p>This study primarily engages with three streams of literature. The first stream is bipartite matching theory, also known as bipartite graph matching, which was originally developed to address the issue of inseparability in resource allocation (<xref ref-type="bibr" rid="B3">3</xref>, <xref ref-type="bibr" rid="B4">4</xref>). This theory has been applied to design matching mechanisms across various markets (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>), including medical and healthcare, labor markets, school selection mechanisms, and kidney exchange markets. Roth (<xref ref-type="bibr" rid="B7">7</xref>) was the first to introduce the concept of bipartite matching and to define the terms &#x0201C;bipartite&#x0201D; and &#x0201C;bipartite matching.&#x0201D; A series of research findings has emerged based on the one-sided vertex arrival model (<xref ref-type="bibr" rid="B8">8</xref>). Some scholars have explored the bipartite matching problem under sequential arrival conditions (<xref ref-type="bibr" rid="B9">9</xref>), edge-weighted online bipartite matching problems (<xref ref-type="bibr" rid="B10">10</xref>), non-stationary online bipartite matching problems (<xref ref-type="bibr" rid="B11">11</xref>), and online matching problems with random rewards (<xref ref-type="bibr" rid="B12">12</xref>). In the current literature, user arrival information is categorized into adversarial and Bayesian arrivals based on the sequence of users arriving online. The occurrence of major epidemics is often sudden, leading to uncertainty in the timing and quantity of information from suppliers and recipients. Consequently, the online matching problem is characterized as an adversarial complete online matching problem.</p>
<p>The second stream is the sharing economy. The sharing economy enhances the efficiency of utilizing decentralized private assets by facilitating large-scale collaborative activities among individuals (<xref ref-type="bibr" rid="B13">13</xref>). Serving as a link among suppliers and recipients, sharing platforms integrate offline idle items, labor, and resources, enabling effective matching and trading of resources, which ultimately leads to profit generation. These platforms employ location-based technologies and algorithms to search for and match resources, providing users with information sorted by these algorithms in real time (<xref ref-type="bibr" rid="B14">14</xref>). An efficient recommendation system, supported by big data analysis and machine learning, improves matching efficiency and helps alleviate the &#x0201C;information problem&#x0201D; (<xref ref-type="bibr" rid="B13">13</xref>). Existing studies provide valuable insights for addressing online matching challenges.</p>
<p>The third stream focuses on emergency resource allocation during public health events. In the event of a public health emergency, the most affected areas may encounter various challenges due to insufficient medical personnel and supplies (<xref ref-type="bibr" rid="B15">15</xref>). Given the constraints of limited resources, a critical issue is how to allocate these resources effectively across different areas of demand to control the epidemic as swiftly and effectively as possible (<xref ref-type="bibr" rid="B16">16</xref>). To enhance the effective allocation of emergency resources, some researchers have developed collaborative emergency medical resource allocation models driven by epidemic forecasts to address collaborative decision-making challenges with multiple objectives (<xref ref-type="bibr" rid="B17">17</xref>). A demand forecasting model with a general demand forecasting function was constructed to address the short-sighted behavior often observed in medical resource allocation (<xref ref-type="bibr" rid="B18">18</xref>). In response to the multi-regional Ebola outbreak, a two-stage model was established, taking into account a limited medical treatment team to determine both the timing of resource allocation decisions and the quantity of resources allocated (<xref ref-type="bibr" rid="B19">19</xref>). Considering the high volatility and time-varying characteristics of COVID-19, a multi-stage, multi-type online medical service model was developed (<xref ref-type="bibr" rid="B20">20</xref>). Additionally, some scholars have proposed a meta-population online resource allocation and epidemic transmission coupling model (<xref ref-type="bibr" rid="B21">21</xref>), examined the fairness of vaccine resource allocation (<xref ref-type="bibr" rid="B22">22</xref>), and analyzed the space-time competition of medical supply and demand (<xref ref-type="bibr" rid="B23">23</xref>).</p>
<p>Based on a review of the existing literature, this study identifies two significant research gaps. First, while some studies have examined decision-making in the allocation of emergency resources for public health crises, the focus has primarily been on predictive and optimized resource allocation methods. There is a scarcity of literature addressing the application of shared organizational models in the context of allocating resources for public health emergencies. Second, although new resource organization models based on sharing platforms have been widely adopted in sectors such as transportation, goods delivery, housing leasing, and online medical consultations, there is limited literature on the application of spatial-temporal online matching methods to allocate public health emergency resources. Furthermore, the emergence of resource allocation models based on sharing platforms presents new opportunities for the efficient allocation of anti-epidemic resources in the digital age.</p></sec>
<sec id="s3">
<title>Model formulation</title>
<sec>
<title>Problem definition</title>
<p>The HIS platform connects individuals, objects, and their informational resources in both fixed and mobile environments through high-speed communication networks (<xref ref-type="bibr" rid="B24">24</xref>). This connectivity effectively coordinates the allocation of anti-epidemic resources. The online matching problem primarily involves pairing suitable resources from suppliers with recipients affected by the epidemic. The HIS allocates anti-epidemic resources among recipients and suppliers according to online matching rules, aiming to fulfill the needs for these resources as quickly and broadly as possible (<xref ref-type="fig" rid="F1">Figure 1</xref>). In the pursuit of maximizing resource matching, the deployment time of anti-epidemic resources emerges as a critical influencing factor that plays a vital role in effectively managing the epidemic. Therefore, we concentrate on maximizing the matching of anti-epidemic resources while minimizing the total waiting time.</p>
<fig position="float" id="F1">
<label>Figure 1</label>
<caption><p>The HIS of anti-epidemic resource management.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpubh-13-1644499-g0001.tif">
<alt-text content-type="machine-generated">Diagram showing an Internet of Healthcare Sharing System. Infected and non-infected area recipients post resource requests and receive matching results. The system uses an online matching mechanism with resource demand and supply management for anti-epidemic resources such as health workers and vaccines. Suppliers share resource information and get matching results across three levels.</alt-text>
</graphic>
</fig>
<p>The recipient <italic>i</italic> &#x02208; <bold><italic>D</italic></bold> and the resource supplier <italic>j</italic> &#x02208; <bold><italic>S</italic></bold> dynamically arrive at HIS in a time series order. Recipient <italic>i</italic> can be represented by a quintuple <italic>i</italic> &#x0003D; (<italic>id</italic><sub><italic>i</italic></sub>, <italic>loc</italic><sub><italic>i</italic></sub>, <italic>dr</italic><sub><italic>i</italic></sub>, <italic>requesttime</italic><sub><italic>i</italic></sub>, <italic>q</italic><sub><italic>i</italic></sub>), where <italic>id</italic><sub><italic>i</italic></sub> indicates a specific identifier, <italic>loc</italic><sub><italic>i</italic></sub> indicates the location, <italic>dr</italic><sub><italic>i</italic></sub> &#x02208; {<italic>high, low</italic>} indicates the epidemic prevention level, <italic>requesttime</italic><sub><italic>i</italic></sub> indicates the request time, and <italic>q</italic><sub><italic>i</italic></sub> indicates the required quantity. Supplier <italic>j</italic> is represented by <italic>j</italic> &#x0003D; (<italic>id</italic><sub><italic>j</italic></sub>, <italic>loc</italic><sub><italic>j</italic></sub>, s<italic>r</italic><sub><italic>j</italic></sub>, <italic>requesttime</italic><sub><italic>j</italic></sub>, <italic>q</italic><sub><italic>j</italic></sub>, <italic>l</italic><sub><italic>j</italic></sub>), where <italic>id</italic><sub><italic>j</italic></sub> indicates a specific identifier, <italic>loc</italic><sub><italic>j</italic></sub> indicates the location, <italic>sr</italic><sub><italic>j</italic></sub> &#x02208; {1, 2, 3} indicates the supply level, <italic>requesttime</italic><sub><italic>j</italic></sub> indicates the supply time, <italic>q</italic><sub><italic>j</italic></sub> indicates the quantity supplied, and <italic>l</italic><sub><italic>j</italic></sub> indicates the largest geographical range that <italic>j</italic> can be supplied.</p>
<p>Anti-epidemic resources are categorized into both reusable and non-reusable types. The resource matching set <bold><italic>M</italic></bold> encompasses all matching responses requested by both the supplier and the recipient. Each response can be represented by a quintuple (<italic>i, j, q</italic><sub><italic>ij</italic></sub>, &#x003C4;<sub><italic>ij</italic></sub>, <italic>rate</italic><sub><italic>ij</italic></sub>), where <italic>i</italic> indicates the request from the recipient, <italic>j</italic> indicates the supplier capable of providing resources to <italic>i</italic>, <italic>q</italic><sub><italic>ij</italic></sub> indicates the quantity of resources that <italic>j</italic> can provide to <italic>i</italic>, &#x003C4;<sub><italic>ij</italic></sub> indicates the waiting time required for <italic>i</italic> to <italic>j</italic>, and <italic>rate</italic><sub><italic>ij</italic></sub> indicates the resource matching rate between <italic>j</italic> and <italic>i</italic>.</p></sec>
<sec>
<title>Model formulation</title>
<p>The foundational model is articulated as follows.</p>
<disp-formula id="EQ1"><mml:math id="M1"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mstyle mathvariant="bold-italic"><mml:mi>o</mml:mi><mml:mi>b</mml:mi><mml:mi>j</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>v</mml:mi><mml:mi>e</mml:mi></mml:mstyle><mml:mstyle mathvariant="bold-italic"><mml:mo>.</mml:mo><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>x</mml:mi></mml:mstyle><mml:mtext>&#x000A0;</mml:mtext><mml:mi>f</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(1)</label></disp-formula>
<disp-formula id="EQ2"><mml:math id="M2"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mstyle mathvariant="bold-italic"><mml:mi>s</mml:mi></mml:mstyle><mml:mstyle mathvariant="bold-italic"><mml:mo>.</mml:mo><mml:mi>t</mml:mi></mml:mstyle><mml:mstyle mathvariant="bold-italic"><mml:mo>.</mml:mo></mml:mstyle><mml:mtext>&#x000A0;</mml:mtext><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x02264;</mml:mo><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mi>i</mml:mi><mml:mo>&#x02208;</mml:mo><mml:mi>D</mml:mi></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(2)</label></disp-formula>
<disp-formula id="EQ3"><mml:math id="M3"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x02264;</mml:mo><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mi>j</mml:mi><mml:mo>&#x02208;</mml:mo><mml:mi>S</mml:mi></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(3)</label></disp-formula>
<disp-formula id="EQ4"><mml:math id="M4"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>l</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02264;</mml:mo><mml:msub><mml:mrow><mml:mi>l</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(4)</label></disp-formula>
<disp-formula id="EQ5"><mml:math id="M5"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mo>&#x02200;</mml:mo><mml:mi>d</mml:mi><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0003C;</mml:mo><mml:mi>d</mml:mi><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:msup><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x02032;</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mi>i</mml:mi><mml:mo>,</mml:mo><mml:msup><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x02032;</mml:mi></mml:mrow></mml:msup><mml:mo>&#x02208;</mml:mo><mml:mi>D</mml:mi></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(5)</label></disp-formula>
<disp-formula id="EQ6"><mml:math id="M6"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>D</mml:mi></mml:mstyle></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mo>&#x02200;</mml:mo><mml:mi>s</mml:mi><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0003E;</mml:mo><mml:mi>s</mml:mi><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:msup><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x02032;</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mi>j</mml:mi><mml:mo>,</mml:mo><mml:msup><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x02032;</mml:mi></mml:mrow></mml:msup><mml:mo>&#x02208;</mml:mo><mml:mstyle mathvariant="bold-italic"><mml:mi>S</mml:mi></mml:mstyle></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(6)</label></disp-formula>
<disp-formula id="EQ7"><mml:math id="M7"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>q</mml:mi><mml:mi>u</mml:mi><mml:mi>e</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:msub><mml:mrow><mml:mi>e</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02264;</mml:mo><mml:mi>t</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>q</mml:mi><mml:mi>u</mml:mi><mml:mi>e</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:msub><mml:mrow><mml:mi>e</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02264;</mml:mo><mml:mi>t</mml:mi></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(7)</label></disp-formula>
<disp-formula id="EQ8"><mml:math id="M8"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mo>&#x02265;</mml:mo></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x02208;</mml:mo><mml:mstyle mathvariant="bold-italic"><mml:mi>Z</mml:mi></mml:mstyle><mml:mo>,</mml:mo><mml:mi>i</mml:mi><mml:mo>&#x02208;</mml:mo><mml:mstyle mathvariant="bold-italic"><mml:mi>D</mml:mi></mml:mstyle><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mi>j</mml:mi><mml:mo>&#x02208;</mml:mo><mml:mstyle mathvariant="bold-italic"><mml:mi>S</mml:mi></mml:mstyle></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(8)</label></disp-formula>
<disp-formula id="EQ9"><mml:math id="M9"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo stretchy='false'>(</mml:mo><mml:mi>t</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>=</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:mtable columnalign='left'><mml:mtr columnalign='left'><mml:mtd columnalign='left'><mml:mrow><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x000A0;it&#x000A0;is&#x000A0;matched&#x000A0;between&#x000A0;</mml:mtext><mml:mi>i</mml:mi><mml:mtext>&#x000A0;and&#x000A0;</mml:mtext><mml:mi>j</mml:mi></mml:mrow></mml:mtd></mml:mtr><mml:mtr columnalign='left'><mml:mtd columnalign='left'><mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x000A0;it&#x000A0;is&#x000A0;not&#x000A0;matched&#x000A0;between&#x000A0;</mml:mtext><mml:mi>i</mml:mi><mml:mtext>&#x000A0;and&#x000A0;</mml:mtext><mml:mi>j</mml:mi></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mrow></mml:mrow></mml:math><label>(9)</label></disp-formula>
<p>The objective (<xref ref-type="bibr" rid="B1">1</xref>) of the model is to maximize the total quantity of resource matching. Constraint (<xref ref-type="bibr" rid="B2">2</xref>) ensures that each recipient <italic>i</italic> can obtain anti-epidemic resources that do not exceed their demand during the decision period <italic>t</italic>. Constraint (<xref ref-type="bibr" rid="B3">3</xref>) ensures that the supplier <italic>j</italic> can provide anti-epidemic resources without exceeding their maximum quantity. Constraint (<xref ref-type="bibr" rid="B4">4</xref>) indicates that the supplier <italic>j</italic> must provide resources to the recipient <italic>i</italic> within their service radius. Constraint (<xref ref-type="bibr" rid="B5">5</xref>) prioritizes the recipient <italic>i</italic>with a high level of epidemic prevention. Constraint (<xref ref-type="bibr" rid="B6">6</xref>) prioritizes suppliers <italic>j</italic> with a low supply level. Constraint (<xref ref-type="bibr" rid="B7">7</xref>) indicates that both the recipient <italic>i</italic> and the supplier <italic>j</italic> must arrive at the platform within the matching time window <italic>t</italic>. Constraint (<xref ref-type="bibr" rid="B8">8</xref>) ensures that the quantity of anti-epidemic resources allocated by suppliers to recipients is a non-negative integer. Constraint (<xref ref-type="bibr" rid="B9">9</xref>) indicates whether the supplier <italic>j</italic> allocates resources to the recipient <italic>i</italic>.</p>
<p>The MSODBM is a temporal and spatial dynamic decision-making problem characterized by unpredictability, major outbreaks, and limited information. The arrival of recipients and suppliers in the HIS is marked by uncertainty regarding both timing and quantity. The decision-making process for matching anti-epidemic resources is not only influenced by the current state of events but also has implications for the progression of future events. Given that the number of recipients and suppliers participating in the matching process, as well as the quantity of requested resources, varies across different matching time windows, the <italic>average wait time</italic> and the <italic>average matching rate</italic> serve as critical indicators for evaluating the outcomes of matching.</p>
<p>The total waiting time &#x003C4;<sub><italic>i</italic></sub> consists of waiting for the matching time <inline-formula><mml:math id="M10"><mml:msubsup><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>b</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>c</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> and the travel time <inline-formula><mml:math id="M11"><mml:msubsup><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>v</mml:mi><mml:mi>e</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula>. <inline-formula><mml:math id="M12"><mml:msubsup><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>b</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>c</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> refers to the difference between the match time and the request time for anti-epidemic resources. i.e., <inline-formula><mml:math id="M13"><mml:msubsup><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>b</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>c</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>c</mml:mi><mml:mi>h</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:msub><mml:mrow><mml:mi>e</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>q</mml:mi><mml:mi>u</mml:mi><mml:mi>e</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:msub><mml:mrow><mml:mi>e</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>. <inline-formula><mml:math id="M14"><mml:msubsup><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>b</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>c</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> is influenced by the capacity of resource supply, the selection of time windows for platform matching, and the matching strategy employed. <inline-formula><mml:math id="M15"><mml:msubsup><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>v</mml:mi><mml:mi>e</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> represents the routing time following the allocation of anti-epidemic resources. Assuming a constant speed, <inline-formula><mml:math id="M16"><mml:msubsup><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>v</mml:mi><mml:mi>e</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> is determined by the distance between the supplier and the recipient.</p>
<p>The average wait time <italic>avg</italic><sub>&#x003C4;</sub> is the ratio of the total waiting time for matching to the number of requests made by all recipients within the matching time window. It can be calculated by the <xref ref-type="disp-formula" rid="EQ10">Equation 10</xref>.</p>
<disp-formula id="EQ10"><mml:math id="M17"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>a</mml:mi><mml:mi>v</mml:mi><mml:msub><mml:mrow><mml:mi>g</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x02208;</mml:mo><mml:mi>M</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mo>|</mml:mo><mml:mi>M</mml:mi><mml:mo>|</mml:mo></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(10)</label></disp-formula>
<p>The average match rate <italic>avg</italic><sub><italic>rate</italic></sub> is the ratio of the total completion rates of all recipients to the number of recipients within the specified matching time window. The average match rate can be calculated using <xref ref-type="disp-formula" rid="EQ11">Equation 11</xref>.</p>
<disp-formula id="EQ11"><mml:math id="M18"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>a</mml:mi><mml:mi>v</mml:mi><mml:msub><mml:mrow><mml:mi>g</mml:mi></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>e</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x02208;</mml:mo><mml:mi>M</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mo>|</mml:mo><mml:mi>M</mml:mi><mml:mo>|</mml:mo></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(11)</label></disp-formula>
<p>Where |<bold><italic>M</italic></bold>| indicates the total number of recipient <italic>i</italic> which participate in <italic>t</italic>; <italic>r</italic><sub><italic>i</italic></sub>(<italic>t</italic>) indicates the matching completion rate of the recipient <italic>i</italic> which participate in <italic>t</italic>, as shown in <xref ref-type="disp-formula" rid="EQ2">Equation 12</xref>.</p>
<disp-formula id="EQ12"><mml:math id="M19"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>c</mml:mi><mml:mi>h</mml:mi><mml:mi>e</mml:mi><mml:mi>d</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(12)</label></disp-formula></sec></sec>
<sec id="s4">
<title>Methods</title>
<sec>
<title>Matching time window selection</title>
<p>Choosing the appropriate matching time window significantly influences the waiting time experienced by resource recipients. There are two primary types of matching time windows: instant matching and batch matching (<xref ref-type="bibr" rid="B25">25</xref>). While instant matching can minimize individual waiting times, it may not always be the most optimal solution. Conversely, batch matching enhances the overall matching efficiency of the HIS platform (<xref ref-type="bibr" rid="B11">11</xref>). The size of the batch matching time window is also crucial. This study examines the <italic>fixed time window batch matching strategy</italic> (FTWBM) and the <italic>adaptive time window batch matching strategy</italic> (ATWBM).</p>
<p>In the FTWBM strategy, both the recipient and the supplier arrive randomly at the HIS platform over a time series. During a specified time period <bold><italic>T</italic></bold>, the HIS platform divides this period into <italic>n</italic> matching time windows of equal duration (<italic>t</italic><sub>1</sub>, <italic>t</italic><sub>2</sub>, &#x022EF;, <italic>t</italic><sub><italic>n</italic></sub>). The size of each matching time window is <italic>bs</italic>. The HIS platform collects requests from recipients and suppliers within each matching time window and organizes resource matching at the conclusion of the window. For instance, if the time period is set to 24 h (<italic>T</italic> &#x0003D; 24h) and the matching time window is 10 min (<italic>bs</italic> &#x0003D; 10), a total of 144 fixed matching time windows can be generated. This implies that 144 resource matching tasks must be executed within a single day. Simultaneously, the HIS platform seeks to maximize the match within each time window.</p>
<p>Unlike the FTWBM, the ATWBM minimizes waiting time by automatically selecting a series of matching window sizes based on a specific strategy. The HIS platform also divides the time period <bold><italic>T</italic> </bold>into <italic>n</italic> matching time windows (<italic>t</italic><sub>1</sub>, <italic>t</italic><sub>2</sub>, &#x022EF;, <italic>t</italic><sub><italic>n</italic></sub>), although the sizes of these windows may vary. Before each match begins, the HIS platform continues to gather requests from both recipients and suppliers to create a matching task set. Once the matching process is complete, the successfully matched recipients and suppliers are removed from their respective sets. In the subsequent matching time window, new requests from recipients and suppliers may arrive, or some recipients and suppliers may depart. Consequently, the recipient set <bold><italic>D</italic> </bold>and the supplier set <bold><italic>S</italic> </bold>are updated. The ATWBM dynamically selects an appropriate matching time window based on the feedback reward.</p></sec>
<sec>
<title>Markov decision process for matching</title>
<p>The HIS platform utilizes batch matching, which allows resource suppliers and recipients to wait for a specified period. This process can be modeled as a Markov decision process. In this framework, the agent continuously interacts with the environment, receiving the current state from it at time <italic>t</italic>. Based on this state, the agent selects an action <italic>A</italic>, which then influences the environment, resulting in a reward <italic>R</italic><sub><italic>t</italic></sub> and a new state being returned to the agent. The Markov sequence stipulates that the generation of the next state depends solely on the current state. Specifically, when new suppliers or recipients arrive, two states&#x02014;holding and matching&#x02014;can be adopted. The action involves selecting a matching time window. Once the matching time window is determined, a matching timestamp <italic>t</italic> is generated, allowing the matching action to proceed. If <italic>requesttime</italic><sub><italic>i</italic></sub>&#x0003C;<italic>t</italic> and the matching state is not a complete match (<italic>rate</italic><sub><italic>i</italic></sub> &#x0003C; 1), the recipient <italic>i</italic> is included in the recipient set <bold><italic>D</italic></bold><sub><bold><italic>t</italic></bold></sub>. If <italic>requesttime</italic><sub><italic>j</italic></sub>&#x0003C;<italic>t</italic> and the matching state is not a complete match (<italic>rate</italic><sub><italic>j</italic></sub> &#x0003C; 1), the supplier <italic>j</italic> is included in the supplier set <bold><italic>S</italic></bold><sub><bold><italic>t</italic></bold></sub>. Those that do not meet the matching conditions will remain holding in the buffer (see <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S1</xref>). Meanwhile, the elements in the recipient and supplier sets are sorted according to time, respectively.</p></sec>
<sec>
<title>Reinforcement learning-based adaptive time window batch matching</title>
<p>This study addresses the problem of Markov decision processes with batch matching by employing reinforcement learning to select adaptive time window sizes. Reinforcement learning involves mapping the relationship between learning states and behaviors, focusing on how to make decisions under uncertain conditions to maximize benefits (<xref ref-type="bibr" rid="B26">26</xref>). The multi-armed bandit (MAB) problem is a classic reinforcement learning challenge in which a system contains k arms, each yielding a different reward when selected. Decision-makers initially lack knowledge of the rewards associated with each action but gradually accumulate information through interactions with the system over a time period <bold><italic>T</italic></bold>. The objective of the decision-maker is to maximize total revenue within <bold><italic>T</italic></bold>. Exploration and exploitation are two fundamental concepts in reinforcement learning. Exploration refers to the strategy of trying various actions to discover the maximum reward, while exploitation involves selecting an action that is known to yield a substantial reward. The MAB framework gathers information by exploring different actions and uses it to maximize rewards through exploration-exploitation trade-offs. Additionally, the MAB is a key component of stochastic scheduling and is widely applied in fields such as online advertising, recommendation systems, and crowdsourcing tasks (<xref ref-type="bibr" rid="B27">27</xref>).</p>
<p>Adaptive time window batch matching addresses the mechanism of dividing matching time windows within a model to achieve the optimization goal of maximizing matches while minimizing waiting time. Since the rewards associated with specific matching time windows are not known in advance, the HIS platform interacts with the environment through exploration and exploitation strategies. Candidate matching sets are formed by selecting various batch matching time windows, after which the performance of the current state is observed, allowing for dynamic adjustments in subsequent selections. Through this process, the matching time window that yields the best performance is identified and selected to optimize the average waiting time. The MAB algorithm can be employed to solve these types of sequential decision-making problems. The division of matching time windows can be modeled as an MDP, where the current state and actions directly influence the next state. The primary challenge lies in selecting the appropriate matching window at the optimal time to maximize benefits. <xref ref-type="disp-formula" rid="EQ13">Equation 13</xref> utilizes the average waiting time <italic>R</italic><sub><italic>t</italic></sub>(<italic>a</italic>) of the matching time window <italic>t</italic> to calculate a score and update it accordingly.</p>
<disp-formula id="EQ13"><mml:math id="M20"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>a</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mrow><mml:mi>a</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>a</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:mo>&#x022EF;</mml:mo><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>a</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>c</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(13)</label></disp-formula>
<p>Where <italic>a</italic><sub><italic>ic</italic></sub> indicates the average waiting time of the matching time window <italic>t</italic> for the <italic>c</italic>-th selection; <italic>c</italic> indicates the total number of times the matching time window <italic>t</italic> has been selected.</p>
<p>This study selects the matching time window based on the classic &#x003B5;-greedy algorithm (<xref ref-type="bibr" rid="B26">26</xref>). The sizes of the matching time window set <italic>A</italic> &#x0003D; {<italic>bs</italic><sub>1</sub>, <italic>bs</italic><sub>2</sub>, &#x022EF;, <italic>bs</italic><sub><italic>k</italic></sub>} are utilized as the k-arms of MAB. As illustrated in <xref ref-type="other" rid="algorithm_1">Algorithm 1</xref>, a matching time window <italic>t</italic><sub><italic>i</italic></sub> is randomly selected with the probability of &#x003B5;(0 &#x0003C; &#x003B5; &#x0003C; 1) to explore, while the time window with the highest current reward is chosen to exploit with a probability of 1&#x02212;&#x003B5;. Whenever the matching of <italic>t</italic><sub><italic>i</italic></sub> ends, the revenue of <italic>t</italic><sub><italic>i</italic></sub> is updated. To facilitate the rapid learning of the online version, this study introduces a continuous policy improvement interval <italic>K</italic><sub>&#x003B8;</sub> and the decay coefficient &#x003BB; &#x02208; (0, 1) of &#x003B5;<sub><italic>k</italic></sub>. When <italic>K</italic><sub>&#x003B8;</sub> &#x0003D; 0, each time the online algorithm performs a match, the matching time window is updated to initiate a new round of matching, which is entirely optimistic (<xref ref-type="bibr" rid="B28">28</xref>). When <italic>K</italic><sub>&#x003B8;</sub>&#x0003E;1, the algorithm executes several matches using the current strategy before refining it, which is considered partially optimistic. Furthermore, as the number of matches increases, &#x003B5;<sub><italic>k</italic></sub> typically decreases. The algorithm will employ the current strategy with a higher probability (<xref ref-type="bibr" rid="B29">29</xref>). Consequently, <xref ref-type="disp-formula" rid="EQ14">Equation 14</xref> establishes the initial exploration probability &#x003B5;<sub>0</sub>, and each match decays exponentially according to the decay rate &#x003BB;.</p>
<disp-formula id="EQ14"><mml:math id="M21"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B5;</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003B5;</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub><mml:msup><mml:mrow><mml:mi>&#x003BB;</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msup></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(14)</label></disp-formula>
<statement content-type="algorithm" id="algorithm_1">
<label>Algorithm 1</label>
<p>Adaptive time window batch bipartite matching algorithm.
<preformat>
<bold>Input:</bold> the sizes of time window batch set <italic><bold>BS</bold></italic>, the timestamp set <italic><bold>TS</bold></italic>, policy improvement interval, the exploration coefficient, the decay coefficient &#x003BB;.
<bold>Output:</bold>
The maximum matching set <italic><bold>M</bold></italic>, the average waiting time set <italic><bold>AT</bold></italic>, and the average matching rate <italic><bold>RT</bold></italic>.
<bold>Algorithm</bold>
1: <italic>R</italic>&#x02190;[0for<italic>bs</italic>in<bold><italic>A</italic></bold>] 
2: &#x003C9;&#x02190;0, initialize time window batch <italic>bs</italic><sub>0</sub> 
3: for <italic>k</italic> &#x0003D; 1, 2, &#x022EF;&#x02009; do: 
4: if <italic>random</italic>(0, 1) &#x02264; &#x003B5;<sub><italic>k</italic></sub> then 
5: <italic>bs</italic>&#x02190;<italic>random choice</italic>(<italic>BS</italic>) 
6: else 
7: <italic>bs</italic>&#x02190;<italic>bs</italic><sub>&#x003C9;</sub> 
8: end if 
9: set the match timestamp as <italic>ts</italic> 
10: get recipients set <italic><bold>D</bold></italic> and suppliers set <italic><bold>S</bold></italic> smaller than the current timestamp and the matching status &#x0003C; 1 respectively 
11: do Algorithm 2 
12: calculate<italic>R</italic><sub><italic>t</italic></sub> 
13: <italic>R</italic>[<italic>bs</italic>]&#x02190;<italic>R</italic><sub><italic>t</italic></sub> 
14: if <italic>k</italic> &#x0003D; =(&#x003C9;&#x0002B;1)<italic>K</italic><sub>&#x003B8;</sub> then 
15: <italic>bs</italic><sub>&#x003C9;&#x0002B;1</sub>&#x02190;<italic>A</italic>[min(<italic>R</italic>)] 
16: &#x003C9;&#x02190;&#x003C9;&#x0002B;1 
17: end if 
18: end for
</preformat>
</p>
</statement>
</sec>
<sec>
<title>Nearest neighbor first-based bipartite matching</title>
<p>The supply-demand bipartite matching network is based on the service radius of suppliers. <xref ref-type="disp-formula" rid="EQ4">Equation 4</xref> demonstrates that each supplier <italic>j</italic> is constrained by their service scope, with the maximum service scope being defined as <italic>l</italic><sub><italic>j</italic></sub>. In the bipartite network <italic>G</italic>&#x0003C;<italic>U, V, E</italic>(<italic>U, V</italic>)&#x0003E; consisting of suppliers and recipients, where <italic>U</italic> &#x0003D; <bold><italic>D</italic></bold><sub><italic>t</italic></sub>, and <italic>V</italic> &#x0003D; <bold><italic>S</italic></bold><sub><italic>t</italic></sub>, calculate Manhattan distance <italic>l</italic><sub><italic>ij</italic></sub> between the recipient <italic>i</italic> and the supplier <italic>j</italic>. According to the <xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>, if <italic>l</italic><sub><italic>ij</italic></sub> &#x02264; <italic>l</italic><sub><italic>j</italic></sub>, there is an edge between <italic>i</italic> and <italic>j</italic>, and the distance is used as the weight of the edge, that is, <italic>E</italic>(<italic>i, j</italic>) &#x0003D; <italic>l</italic><sub><italic>ij</italic></sub>. if <italic>l</italic><sub><italic>ij</italic></sub>&#x0003E;<italic>l</italic><sub><italic>j</italic></sub>, there is no match between <italic>i</italic> and <italic>j</italic>, and set <italic>E</italic>(<italic>i, j</italic>) &#x0003D; &#x02212;1.</p>
<p>The nearest neighbor first (NNF) strategy considers the distance between suppliers and recipients by incorporating distance-based priority matching constraints. <xref ref-type="disp-formula" rid="EQ15">Equation 15</xref> prioritizes the allocation of anti-epidemic resources from suppliers to recipients that are closer in proximity, thereby maximizing matching while minimizing <inline-formula><mml:math id="M22"><mml:msubsup><mml:mrow><mml:mi>&#x003C4;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>v</mml:mi><mml:mi>e</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula>. Let <italic>L</italic><sub><italic>i</italic></sub> represent a set of <italic>l</italic><sub><italic>ij</italic></sub>, which includes all suppliers that can be matched with recipients. Select min(<italic>l</italic><sub><italic>ij</italic></sub>) as the prioritized matching for recipients (see <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S2</xref>).</p>
<disp-formula id="EQ15"><mml:math id="M23"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>D</mml:mi></mml:mstyle></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mo>&#x02200;</mml:mo><mml:msub><mml:mrow><mml:mi>l</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:msup><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x02032;</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:msub><mml:mo>&#x0003C;</mml:mo><mml:msub><mml:mrow><mml:mi>l</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(15)</label></disp-formula>
<p>Multi-stage bipartite graph matching is predicated on the priorities of suppliers and recipients. Based on the recipient&#x00027;s anti-epidemic priority attribute <italic>dr</italic> and <xref ref-type="disp-formula" rid="EQ5">Equation 5</xref>, the bipartite network <italic>G</italic>&#x0003C;<italic>U, V, E</italic>(<italic>U, V</italic>)&#x0003E; is partitioned into <italic>G</italic><sub><italic>PH</italic></sub>&#x0003C;<italic>U, V, E</italic>(<italic>U, V</italic>)&#x0003E; with high-priority recipients, and <italic>G</italic><sub><italic>PL</italic></sub>&#x0003C;<italic>U, V, E</italic>(<italic>U, V</italic>)&#x0003E;with low-priority recipients (see <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S3</xref>). Subsequently, <italic>G</italic><sub><italic>PH</italic></sub>&#x0003C;<italic>U, V, E</italic>(<italic>U, V</italic>)&#x0003E; and <italic>G</italic><sub><italic>PL</italic></sub>&#x0003C;<italic>U, V, E</italic>(<italic>U, V</italic>)&#x0003E; are divided into three stages according to the supplier&#x00027;s level <italic>sr</italic> &#x0003D; { 1, 2, 3 } , respectively (see <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S4</xref>). As shown in <xref ref-type="other" rid="algorithm_2">Algorithm 2</xref>, the set <bold><italic>U</italic> </bold>matches the set <bold><italic>V</italic> </bold>with <italic>sr</italic> &#x0003D; 1 in the first stage. If the matching is not fully completed, the second stage of matching is performed, wherein set <bold><italic>U</italic> </bold>matches set <bold><italic>V</italic> </bold>with <italic>sr</italic> &#x0003D; 2. Similarly, the third stage of matching is conducted until the matching is successfully completed. If, at any stage, set <bold><italic>U</italic> </bold>completes matching, the process is terminated.</p>
<statement content-type="algorithm" id="algorithm_2">
<label>Algorithm 2</label>
<p>Service-level-based multi-stage matching algorithm (G-HMBMC).
<preformat>
<bold>Input:</bold>
G &#x0003C; U,V,E(U,V)&#x0003E;
<bold>Algorithm</bold>
1: <italic>SR</italic> &#x0003D; {1, 2, 3} 
2: for <italic>sr</italic> &#x02208; <italic>SR</italic> do: 
3: <italic>V</italic><sub><italic>sr</italic></sub>&#x02190;<italic>j</italic>, for <italic>j</italic> in <italic>V</italic> and <italic>j</italic><sub><italic>sr</italic></sub> &#x0003D; <italic>sr</italic> 
4: if <italic>G</italic><sub><italic>PH</italic></sub>&#x0003C;<italic>U, V, E</italic>(<italic>U, V</italic>)&#x0003E;then 
5: do GMBMC algorithm 
6: else 
7: do HMBMC algorithm 
8: end if 
9: if <italic>U</italic> &#x0003D; =&#x02205; then 
10: break 
11: end if 
12: end for
</preformat>
</p>
</statement>
<p>Prioritizing the allocation of resources to areas that have been significantly impacted by the epidemic can aid in containing outbreaks within these areas and in preventing further transmission. In the process of matching anti-epidemic resources, recipients with higher priority levels are given precedence in the matching procedure. The Greedy-based many-to-many bipartite matching algorithm with capacity (see <xref ref-type="supplementary-material" rid="SM1">Algorithm S1</xref>) operates under the assumption that the current high-priority recipient will consistently be matched with the most advantageous supplier, irrespective of the matching decisions made by other recipients.</p>
<p>For the set of recipients with low priority, the maximum matching is determined using the classic Hungarian algorithm, a combinatorial optimization algorithm for solving task allocation problems in polynomial time. This algorithm identifies the maximum matching by continuously locating augmenting paths to increase the number of matching edges and vertices. It effectively addresses task allocation challenges to optimize resource utilization and is widely applied across various fields involving resource matching problems. The classic Hungarian algorithm primarily addresses assignments involving a single task or resource, without accounting for capacity constraints. Conversely, the allocation of anti-epidemic resources must consider the quantity of resources allocated, presenting a matching problem with capacity limitations. Therefore, this study incorporates capacity attributes into the vertices of bipartite graph networks (see <xref ref-type="supplementary-material" rid="SM1">Algorithm S2</xref>) and defines a recursive function <italic>getPath</italic>(<italic>i, q</italic><sub><italic>i</italic></sub>) to identify augmenting paths. Additionally, the classic Hungarian algorithm is designed to solve one-to-one matching problems. However, there exists a mismatch of anti-epidemic resources between recipients and suppliers, resulting in a many-to-many matching problem. Consequently, it is essential to extend the classic Hungarian algorithm to accommodate many-to-many matching, which can be achieved by enhancing the augmenting path search mechanism.</p></sec></sec>
<sec id="s5">
<title>Experimental analysis</title>
<sec>
<title>Experimental setup</title>
<p>This study delineates the findings of an experiment conducted utilizing the proposed algorithm on synthetic datasets. The decision period is established at |<bold><italic>T</italic></bold>| &#x0003D; 120. Within this timeframe, recipient requests and supplier resources are introduced randomly in chronological order, generating corresponding data based on the characteristics of both resource recipients and suppliers. The anti-epidemic level (<italic>dr</italic> &#x0003D; {<italic>high, low</italic>}) of the recipients is randomly assigned in accordance with the demand response, while the suppliers&#x00027; levels (<italic>sr</italic> &#x0003D; {1, 2, 3}) are generated randomly based on the supply response. In consideration of the availability of anti-epidemic resources, the ratio of the quantity of resources requested by the recipient to those supplied by the supplier is approximately set at 0.8. A total of 3,000 sets of recipient requests and 1,800 sets of supplier resources are generated randomly.</p>
<p>The FTWBM experiment selects any matching time window from the <bold><italic>BS</italic></bold> for testing, while the ATWBM experiment randomly selects a matching time window <italic>t</italic> with a probability of &#x003B5;<sub><italic>k</italic></sub> for exploration. The remaining time window is then selected for exploitation with a probability of 1&#x02212;&#x003B5;<sub><italic>k</italic></sub>. To facilitate rapid learning in the online version, <xref ref-type="table" rid="T1">Table 1</xref> establishes the decay coefficient &#x003BB; for &#x003B5;<sub><italic>k</italic></sub> and the continuous strategy improvement intervals <italic>K</italic><sub>&#x003B8;</sub>.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Experimental parameter settings.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left"><bold>Parameters</bold></th>
<th valign="top" align="center"><bold>Values</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">|<bold><italic>T</italic></bold>|</td>
<td valign="top" align="center">120</td>
</tr>
<tr>
<td valign="top" align="left">|<bold><italic>D</italic></bold>|</td>
<td valign="top" align="center">3,000</td>
</tr>
<tr>
<td valign="top" align="left">|<bold><italic>S</italic></bold>|</td>
<td valign="top" align="center">1,800</td>
</tr>
<tr>
<td valign="top" align="left">BS</td>
<td valign="top" align="center">{1,2,3,4,6,8}</td>
</tr>
<tr>
<td valign="top" align="left">&#x003B5;<sub>0</sub></td>
<td valign="top" align="center">{0.02, 0.2,0.8}</td>
</tr>
<tr>
<td valign="top" align="left"><italic>K</italic><sub>&#x003B8;</sub></td>
<td valign="top" align="center">{0,2}</td>
</tr>
<tr>
<td valign="top" align="left">&#x003BB;</td>
<td valign="top" align="center">{0.2,0.8}</td>
</tr></tbody>
</table>
</table-wrap></sec>
<sec>
<title>Experimental results</title>
<sec>
<title>Impact of fixed batch size on the matching time window</title>
<p><xref ref-type="fig" rid="F2">Figure 2</xref> illustrates the average matching rate and average waiting time for anti-epidemic resources under fixed matching time windows with varying batch sizes. As batch size increases from 1 to 8, the average match rate shows a clear upward trend, with median values rising from approximately 0.5 to 0.89, indicating improved matching efficiency at larger batch sizes. The instant matching result (<italic>bs</italic> &#x0003D; 1) is inferior to the delayed batch matching across other fixed time windows in terms of average matching rate. Conversely, the average waiting time initially decreases, then rises after exceeding a certain threshold. The average waiting time gradually decreases from <italic>bs</italic> &#x0003D; 1 to <italic>bs</italic> &#x0003D; 4, after which it begins to rise (from <italic>bs</italic> &#x0003D; 4 to <italic>bs</italic> &#x0003D; 8). Indeed, <italic>bs</italic> &#x0003D; 4 strikes a balance between average waiting time and matching rate, making it an optimal choice for a fixed batch matching time window. It facilitates a reasonable waiting time while achieving a satisfactory matching rate. The result demonstrates that increasing batch size enhances matching efficiency but risks increasing waiting time variability. While larger batches yield higher match rates, they do not consistently reduce waiting time and may even worsen it due to aggregation delays. Therefore, batch size should be carefully tuned to achieve the best balance between matching performance and user experience. It is particularly important to dynamically adjust the batch size through an adaptive batching strategy.</p>
<fig position="float" id="F2">
<label>Figure 2</label>
<caption><p>Results across batch sizes (bs). <bold>Left</bold>: Average match rate; <bold>Right</bold>: Average waiting time. Each boxplot shows median (red line), interquartile range (box), whiskers (1.5 &#x000D7; IQR), outliers (circles), and mean (green diamond).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpubh-13-1644499-g0002.tif">
<alt-text content-type="machine-generated">Two box plot charts side by side. The left chart shows the average hit rate for different batch sizes (bs-1 to bs-8), with values generally increasing. The right chart displays average waiting time for the same batch sizes, where values decrease initially and stabilize with some outliers, especially for batch size bs-4 and beyond. Each box plot includes mean (green diamond), median (red line), and variability indicators.</alt-text>
</graphic>
</fig>
<p>From a statistical perspective, <xref ref-type="table" rid="T2">Table 2</xref> reveals a clear and statistically significant improvement in average match rate (AR) with increasing batch size (<italic>bs</italic>), as evidenced by non-overlapping 95% confidence intervals across all conditions, indicating consistent and reliable gains. Conversely, while average waiting time (AT) increases monotonically, the substantial overlap between 95% CIs suggests that most pairwise differences are not statistically significant. This highlights a trade-off where higher matching efficiency comes at the cost of longer delays, but only marginally so until larger batches. Notably, the precision of AR estimates remains high due to narrow CIs and low standard errors, whereas AT estimates become less reliable as sample sizes decrease, reflected in wider CIs. Overall, the data support a strong positive effect of batch size on matching performance with high statistical credibility, while the impact on waiting time is less certain. <italic>bs</italic> &#x0003D; 4 emerges as an optimal balance, achieving high AR (77.0%, 95% CI [0.706, 0.834]) with minimal delay increase (11.64 min, 95% CI [10.501, 12.777]) and sufficient statistical precision.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Statistical results of average match rate and average waiting time across different batch sizes (<italic>bs</italic>).</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th valign="top" align="center" colspan="6"><bold>The average match rate (AR)</bold></th>
<th valign="top" align="center" colspan="6"><bold>The average waiting time (AT)</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td/>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>1</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>2</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>3</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>4</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>6</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>8</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>1</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>2</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>3</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>4</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>6</bold></td>
<td valign="top" align="center"><italic><bold>bs</bold></italic> = <bold>8</bold></td>
</tr>
<tr>
<td valign="top" align="left">n</td>
<td valign="top" align="center">120</td>
<td valign="top" align="center">60</td>
<td valign="top" align="center">40</td>
<td valign="top" align="center">30</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">120</td>
<td valign="top" align="center">60</td>
<td valign="top" align="center">40</td>
<td valign="top" align="center">30</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">15</td>
</tr>
<tr>
<td valign="top" align="left"><italic>median</italic></td>
<td valign="top" align="center">0.486</td>
<td valign="top" align="center">0.684</td>
<td valign="top" align="center">0.757</td>
<td valign="top" align="center">0.819</td>
<td valign="top" align="center">0.889</td>
<td valign="top" align="center">0.890</td>
<td valign="top" align="center">11.325</td>
<td valign="top" align="center">11.507</td>
<td valign="top" align="center">11.675</td>
<td valign="top" align="center">11.153</td>
<td valign="top" align="center">12.039</td>
<td valign="top" align="center">13.213</td>
</tr>
<tr>
<td valign="top" align="left"><italic><inline-formula><mml:math id="M24"><mml:mover accent="true"><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo>&#x00304;</mml:mo></mml:mover></mml:math></inline-formula></italic></td>
<td valign="top" align="center">0.500</td>
<td valign="top" align="center">0.654</td>
<td valign="top" align="center">0.711</td>
<td valign="top" align="center">0.770</td>
<td valign="top" align="center">0.828</td>
<td valign="top" align="center">0.859</td>
<td valign="top" align="center">11.310</td>
<td valign="top" align="center">11.516</td>
<td valign="top" align="center">11.862</td>
<td valign="top" align="center">11.639</td>
<td valign="top" align="center">12.520</td>
<td valign="top" align="center">13.330</td>
</tr>
<tr>
<td valign="top" align="left"><italic>s</italic></td>
<td valign="top" align="center">0.248</td>
<td valign="top" align="center">0.220</td>
<td valign="top" align="center">0.195</td>
<td valign="top" align="center">0.172</td>
<td valign="top" align="center">0.145</td>
<td valign="top" align="center">0.119</td>
<td valign="top" align="center">3.803</td>
<td valign="top" align="center">3.411</td>
<td valign="top" align="center">3.344</td>
<td valign="top" align="center">3.048</td>
<td valign="top" align="center">2.830</td>
<td valign="top" align="center">2.616</td>
</tr>
<tr>
<td valign="top" align="left">SE</td>
<td valign="top" align="center">0.023</td>
<td valign="top" align="center">0.028</td>
<td valign="top" align="center">0.031</td>
<td valign="top" align="center">0.031</td>
<td valign="top" align="center">0.033</td>
<td valign="top" align="center">0.031</td>
<td valign="top" align="center">0.347</td>
<td valign="top" align="center">0.440</td>
<td valign="top" align="center">0.529</td>
<td valign="top" align="center">0.556</td>
<td valign="top" align="center">0.633</td>
<td valign="top" align="center">0.675</td>
</tr>
<tr>
<td valign="top" align="left">ME</td>
<td valign="top" align="center">0.045</td>
<td valign="top" align="center">0.057</td>
<td valign="top" align="center">0.062</td>
<td valign="top" align="center">0.064</td>
<td valign="top" align="center">0.068</td>
<td valign="top" align="center">0.066</td>
<td valign="top" align="center">0.687</td>
<td valign="top" align="center">0.881</td>
<td valign="top" align="center">1.069</td>
<td valign="top" align="center">1.138</td>
<td valign="top" align="center">1.325</td>
<td valign="top" align="center">1.448</td>
</tr>
<tr>
<td valign="top" align="left">95% CI</td>
<td valign="top" align="center">[0.456, 0.545]</td>
<td valign="top" align="center">[0.597, 0.711]</td>
<td valign="top" align="center">[0.649, 0.773]</td>
<td valign="top" align="center">[0.706, 0.834]</td>
<td valign="top" align="center">[0.760, 0.896]</td>
<td valign="top" align="center">[0.793, 0.925]</td>
<td valign="top" align="center">[10.622, 11.997]</td>
<td valign="top" align="center">[10.635, 12.397]</td>
<td valign="top" align="center">[10.792, 12.931]</td>
<td valign="top" align="center">[10.501, 12.777]</td>
<td valign="top" align="center">[11.196, 13.845]</td>
<td valign="top" align="center">[11.882, 14.779]</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>Impact of adaptive batch sizes on the matching time window</title>
<p>In the context of online matching for anti-epidemic resources utilizing the ATWBM strategy, this study enhances the effectiveness of the G-HMBMC algorithm by dynamically selecting the matching time window through control parameters (see <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S5</xref>): initial exploration probability &#x003B5;<sub>0</sub>, strategy improvement interval <italic>K</italic><sub>&#x003B8;</sub> and attenuation coefficient &#x003BB; of &#x003B5;<sub><italic>k</italic></sub>. The subsequent sections discuss the impact of these parameters on the matching results.</p>
<p><xref ref-type="fig" rid="F3">Figure 3</xref> illustrates the effect of the attenuation coefficient &#x003BB; on the matching results. The data indicate that, in most instances, the matching results under partially optimistic scenarios are superior to those observed in fully optimistic scenarios. In the fully optimistic scenario with <italic>K</italic><sub>&#x003B8;</sub> &#x0003D; 0, when the attenuation coefficient is low (&#x003BB; &#x0003D; 0.2), a larger initial exploration probability (&#x003B5;<sub>0</sub> &#x0003D; 0.8) can yield improved matching results, as shown in <xref ref-type="fig" rid="F3">Figure 3a</xref>. Conversely, when a larger attenuation coefficient (&#x003BB; &#x0003D; 0.8) is employed, a smaller initial exploration probability (&#x003B5;<sub>0</sub> &#x0003D; 0.1,&#x003B5;<sub>0</sub> &#x0003D; 0.02) can yield improved matching results, as shown in <xref ref-type="fig" rid="F3">Figure 3b</xref>. In the scenario of partial optimism with <italic>K</italic><sub>&#x003B8;</sub> &#x0003D; 2, when the attenuation coefficient is low (&#x003BB; &#x0003D; 0.2), the selection of the attenuation coefficient (&#x003B5;<sub>0</sub>) does not significantly influence the matching outcomes, as demonstrated in <xref ref-type="fig" rid="F3">Figure 3c</xref>. However, when the attenuation coefficient is high (&#x003BB; &#x0003D; 0.8), a smaller initial exploration probability (&#x003B5;<sub>0</sub> &#x0003D; 0.1,&#x003B5;<sub>0</sub> &#x0003D; 0.02) facilitates the exploration of better matching time windows, leading to improved matching results, as shown in <xref ref-type="fig" rid="F3">Figure 3d</xref>. The result indicates that with a low attenuation coefficient, the algorithm can maintain a larger exploration space to identify better matching strategies. Conversely, with a low initial exploration probability, the algorithm tends to prioritize the current optimal strategy and neglect exploration, potentially missing the opportunity to discover the optimal matching strategy. In particular, the application of a fully optimistic strategy with a small attenuation coefficient and a partially optimistic strategy with a small attenuation coefficient both produce favorable matching results. These findings underscore the critical importance of maintaining an appropriate level of exploration to achieve improved matching outcomes.</p>
<fig position="float" id="F3">
<label>Figure 3</label>
<caption><p>Impact of the initial exploration probability &#x003B5;<sub>0</sub> on the matching result. Each boxplot shows median (red line), interquartile range (box), whiskers (1.5 &#x000D7; IQR), outliers (circles), and mean (green diamond). <bold>(a)</bold> Result on self-adaptive batch size (<italic>K</italic> = 0, &#x003BB; = 0.2). <bold>(b)</bold> Result on self-adaptive batch size (<italic>K</italic> = 0, &#x003BB; = 0.8). <bold>(c)</bold> Result on self-adaptive batch size (<italic>K</italic> = 2, &#x003BB; = 0.2). <bold>(d)</bold> Result on self-adaptive batch size (<italic>K</italic> = 2, &#x003BB; = 0.8).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpubh-13-1644499-g0003.tif">
<alt-text content-type="machine-generated">Box plots showing results on self-adaptive batch sizes for different values (0.02, 0.1, 0.8) and parameters K and L. The y-axes represent average measure values. Panels (a) and (c) are with k = 0, = 0.2 and K = 2, = 0.2 respectively, while panels (b) and (d) use K = 0, = 0.8 and K = 2, = 0.8 respectively. Box plots display the distribution and variation in scores with marked mean values and potential outliers.</alt-text>
</graphic>
</fig></sec></sec>
<sec>
<title>Discussion</title>
<sec>
<title>Comparison between FTWBM and ATWBM</title>
<p>In the FTWBM strategy, a limited batch size within the matching time window constrains the available matching opportunities for both suppliers and recipients. This restriction leads to suboptimal resource matching and diminished matching rates, consequently increasing the average waiting time. The restricted time window allows only a limited number of supply and demand pairs to be successfully matched, requiring other resources to await the subsequent time window for potential matching. In this context, while the waiting time may be brief, the overall matching rate remains low. Conversely, when the batch size of the matching time window is excessively large, the number of participating supply and demand pairs escalates significantly. This increase can improve the matching rate for both parties, as more resources are allowed to find appropriate matches. However, this approach also complicates the matching process, as the system must handle a larger volume of matching requests. Consequently, this may result in longer online waiting times for recipients, as the matching process may require additional time to identify suitable matches. Therefore, this study aims to determine a relatively optimal matching time window that effectively balances the matching rate and average waiting time through experimental analysis. Nonetheless, in contexts where the progression of the epidemic is unpredictable, and both suppliers and recipients experience dynamic changes, this optimal point may not remain constant. Furthermore, this study corroborates that instant matching is generally less effective in terms of matching outcomes when compared to delayed batch matching.</p>
<p>In comparison to the FTWBM strategy, the optimal performance in partially optimistic scenarios is generally similar to that observed with <italic>bs</italic> &#x0003D; 3. In fully optimistic scenarios, the optimal performance also closely resembles that associated with <italic>bs</italic> &#x0003D; 2. The optimal window size in the FTWBM strategy outperforms the results of the ATWBM strategy. However, the ATWBM strategy demonstrates greater effectiveness in adapting to the dynamic changes in epidemic prevention and control, particularly in partially optimistic scenarios. By optimizing the control parameters of the adaptive time window algorithm, the matching performance can be continuously enhanced. In terms of optimizing matching outcomes, the ATWBM strategy holds a more significant advantage over the FTWBM strategy.</p></sec>
<sec>
<title>Comparison of different MBA algorithms</title>
<p>This study compares the performance differences among Upper Confidence Bound (UCB), Thompson Sampling (TS) and &#x003B5;-Greedy and calculate the corresponding cumulative regret of the algorithm. According to <xref ref-type="fig" rid="F4">Figure 4</xref>, the two box plots compare the performance of three reinforcement learning algorithms across two key metrics: average match rate (depicted in the left plot) and average waiting time (shown in the right plot). In the left plot, UCB demonstrates the most favorable performance. It features the highest median (indicated by the red line) and mean (marked by the green diamond), along with a relatively compact box that signifies a narrow interquartile range, implying consistent and high match rates. Conversely, &#x003B5;-Greedy exhibits a wider box and a lower median, with whiskers extending to both low and high extremes, reflecting greater variability in its match rate. TS falls in between: its median match rate is positioned between those of &#x003B5;-Greedy and UCB, yet it includes outliers with exceptionally low match rates, indicating less stability than UCB. In the right plot, &#x003B5;-Greedy shows the lowest median and mean waiting times. However, it also contains outliers with extremely high waiting times, suggesting that while it typically has short waiting periods, there are instances of significant delays in the process. The UCB&#x00027;s box is centered at a moderate level, indicating moderately stable waiting times without extreme outliers. TS has a higher median and mean waiting time than the other two algorithms. Its whiskers extend to both very low and very high values, indicating that its waiting time is less stable and more variable than that of both &#x003B5;-Greedy and UCB. In summary, UCB stands out for its excellent and stable average matching rate, making it a leader in terms of successful matching consistency. &#x003B5;-Greedy performs the shortest average waiting time but suffers from greater variability.</p>
<fig position="float" id="F4">
<label>Figure 4</label>
<caption><p>Results of &#x003B5;-Greedy, UCB, and Thompson Sampling. Each boxplot shows median (red line), interquartile range (box), whiskers (1.5 &#x000D7; IQR), outliers (circles), and mean (green diamond).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpubh-13-1644499-g0004.tif">
<alt-text content-type="machine-generated">Box plots comparing three strategies: epsilon-Greedy, UCB, and TS. The left plot shows average match rates, with values between 0.4 and 1.0. The right plot shows average waiting times, ranging from 5 to 30. Median, quartiles, and outliers are indicated.</alt-text>
</graphic>
</fig>
<p><xref ref-type="table" rid="T3">Table 3</xref> compares three reinforcement learning strategies&#x02014;&#x003B5;-Greedy, Thompson Sampling (TS), and Upper Confidence Bound (UCB)&#x02014;highlighting significant differences in matching performance, as quantified by the average match rate (AR), while showing no statistically significant differences in average waiting time (AT). For AR, UCB achieves the highest mean (0.845) with a narrow 95% confidence interval [0.780, 0.910], which does not overlap with that of &#x003B5;-Greedy ([0.575, 0.730]), indicating a highly significant improvement. TS performs moderately (0.726, [0.636, 0.815]) and shows partial overlap with both &#x003B5;-Greedy and UCB, suggesting no clear advantage over &#x003B5;-Greedy but possibly inferior to UCB. Conversely, for AT, all three methods show overlapping 95% CIs&#x02014;ranging from [10.287, 13.849] (UCB) to [11.348, 14.724] (TS)&#x02014;indicating no statistically significant differences in delay. Notably, UCB and TS have much wider CIs than &#x003B5;-Greedy due to smaller sample sizes and higher variability, reducing their reliability. Overall, UCB emerges as the most effective strategy, offering significantly higher match rates without demonstrably increasing waiting time, and this is supported by high statistical precision. &#x003B5;-Greedy provides shorter delays with reliable estimates but at the cost of lower matching efficiency.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Statistical results of average match rate and average waiting time for &#x003B5;-Greedy, UCB, and Thompson Sampling.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th valign="top" align="center" colspan="3"><bold>The average match rate (AR)</bold></th>
<th valign="top" align="center" colspan="3"><bold>The average waiting time(AT)</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td/>
<td valign="top" align="center">&#x003B5;<bold>-Greedy</bold></td>
<td valign="top" align="center"><bold>Thompson Sampling (TS)</bold></td>
<td valign="top" align="center"><bold>Upper Confidence Bound (UCB)</bold></td>
<td valign="top" align="center">&#x003B5;<bold>-Greedy</bold></td>
<td valign="top" align="center"><bold>Thompson Sampling (TS)</bold></td>
<td valign="top" align="center"><bold>Upper Confidence Bound (UCB)</bold></td>
</tr>
<tr>
<td valign="top" align="left">n</td>
<td valign="top" align="center">38</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">38</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">18</td>
</tr>
<tr>
<td valign="top" align="left"><italic>median</italic></td>
<td valign="top" align="center">0.678</td>
<td valign="top" align="center">0.757</td>
<td valign="top" align="center">0.889</td>
<td valign="top" align="center">11.625</td>
<td valign="top" align="center">12.679</td>
<td valign="top" align="center">12.373</td>
</tr>
<tr>
<td valign="top" align="left"><inline-formula><mml:math id="M25"><mml:mover accent="true"><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo>&#x00304;</mml:mo></mml:mover></mml:math></inline-formula></td>
<td valign="top" align="center">0.653</td>
<td valign="top" align="center">0.726</td>
<td valign="top" align="center">0.845</td>
<td valign="top" align="center">11.740</td>
<td valign="top" align="center">13.036</td>
<td valign="top" align="center">12.068</td>
</tr>
<tr>
<td valign="top" align="left"><italic>s</italic></td>
<td valign="top" align="center">0.236</td>
<td valign="top" align="center">0.232</td>
<td valign="top" align="center">0.131</td>
<td valign="top" align="center">2.731</td>
<td valign="top" align="center">4.353</td>
<td valign="top" align="center">3.581</td>
</tr>
<tr>
<td valign="top" align="left">SE</td>
<td valign="top" align="center">0.038</td>
<td valign="top" align="center">0.044</td>
<td valign="top" align="center">0.031</td>
<td valign="top" align="center">0.443</td>
<td valign="top" align="center">0.823</td>
<td valign="top" align="center">0.844</td>
</tr>
<tr>
<td valign="top" align="left">ME</td>
<td valign="top" align="center">0.078</td>
<td valign="top" align="center">0.090</td>
<td valign="top" align="center">0.065</td>
<td valign="top" align="center">0.898</td>
<td valign="top" align="center">1.688</td>
<td valign="top" align="center">1.781</td>
</tr>
<tr>
<td valign="top" align="left">95% CI</td>
<td valign="top" align="center">[0.575, 0.730]</td>
<td valign="top" align="center">[0.636, 0.815]</td>
<td valign="top" align="center">[0.780, 0.910]</td>
<td valign="top" align="center">[10.842, 12.638]</td>
<td valign="top" align="center">[11.348, 14.724]</td>
<td valign="top" align="center">[10.287, 13.849]</td>
</tr>
<tr>
<td valign="top" align="left"><italic>CIW</italic></td>
<td valign="top" align="center">0.155</td>
<td valign="top" align="center">0.179</td>
<td valign="top" align="center">0.13</td>
<td valign="top" align="center">1.796</td>
<td valign="top" align="center">3.376</td>
<td valign="top" align="center">3.562</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>Ethics and fairness</title>
<p>The core nature of anti-epidemic resource allocation lies in its public health emergency attribute&#x02014;that is, resource allocation must first serve the collective goal of rapidly controlling the spread of the epidemic and reducing the overall risk of infection or death. This premise defines the trade-off principle, which states that group fairness takes priority over absolute individual fairness. The adaptive time window selection and G-HMBMC multi-stage matching algorithm prioritize ensuring that high-risk groups have access to anti-epidemic resources, which aligns with the emergency attribute of anti-epidemic resource allocation. Meanwhile, by selecting a matching time window with the minimum average waiting time, the algorithm compensates for the potential individual unfairness that may result from prioritizing the group. Through differentiated adaptation in the time dimension and hierarchical regulation during the matching process, the algorithm safeguards the core goal of group fairness. It avoids systematic unfairness at the individual level. Ultimately, it achieves synergy between public health efficiency and fairness.</p></sec>
<sec>
<title>Complexity analysis</title>
<p>The proposed online bandit algorithms (greedy, TS, or UCB) for a dynamic matching problem jointly optimize the matching configuration and arm selection in a sequential decision loop. The overall time complexity is predominantly determined by the main experimental loop and the graph matching algorithms employed within it, rather than by the bandit selection logic itself. The core bandit algorithms, whether Thompson Sampling or UCB, are highly efficient. With a fixed number of arms (K = 6), operations such as choosing an arm and updating the reward estimates are performed in constant time, O(K) = O(1), per time step. The primary computational bottleneck arises from the matching operations (Greedy or Hungarian) required for each selected arm in every iteration. The worst-case time complexity is governed by the Hungarian algorithm, which has a complexity of O(max(N, M)<sup>&#x02227;</sup>3) for bipartite graphs with sets of sizes N and M. This operation is executed a fixed number of times (e.g., six times for different data subsets) per time step T. Consequently, the overall worst-case time complexity is O(T<sup>&#x0002A;</sup> max(N, M)<sup>&#x02227;</sup>3). If a greedy matching algorithm is used instead, this could be reduced to approximately O(T<sup>&#x0002A;</sup>N<sup>&#x0002A;</sup>M). The loop count T is not a direct input variable but is determined by the dynamics of the external environment; however, it contributes a linear factor to the total running time. Therefore, the scalability of the algorithm is highly sensitive to the sizes of the sets being matched (N and M). Regarding space complexity, the requirements are driven by the data structures required for the matching process. Bandit algorithms are memory-efficient and require only O(K) space to store parameters. Significant memory consumption occurs within the experimental loop. The algorithm must store the sets of bipartite graphs, which requires O(N&#x0002B;M) space. Furthermore, matching algorithms, particularly the Hungarian algorithm, often require an O(N<sup>&#x0002A;</sup>M) distance matrix or similar data structures to operate. The bandit list, which records the estimated values for all arms at each time step, consumes O(T<sup>&#x0002A;</sup>K) space, which is typically dominated by the O(N<sup>&#x0002A;</sup>M) requirement for the matching matrices when N and M are large. Thus, the overall space complexity is O(N<sup>&#x0002A;</sup>M). In practice, for large graphs, the O(N<sup>&#x0002A;</sup>M) term is the dominant memory constraint.</p></sec></sec></sec>
<sec sec-type="conclusions" id="s6">
<title>Conclusion</title>
<p>The primary contributions and managerial insights of this study are as follows. First, this study showed that delayed batch matching generally produces superior overall matching results than instant matching in the context of online matching of anti-epidemic resources. As the matching time window expands, the average waiting time initially decreases, then rises again, while the average matching rate continues to increase to a certain extent. Therefore, healthcare operations managers should strive to find a balance between average waiting time and average matching rate when selecting a matching time window, prioritizing a window that offers low average waiting time and high average matching rate. Secondly, there is no universally optimal or static matching time window in the context of unpredictable epidemic developments and dynamic fluctuations in supply and demand. Healthcare operations managers should periodically adjust the matching time window based on trends in epidemic progression and resource availability. In scenarios where the epidemic spreads rapidly, resulting in increased resource requests from the infected demand side and potential supply shortages, a larger matching time window can increase the average matching rate; however, this may lead to longer waiting times. Conversely, a smaller matching time window may also be effectively utilized. Thirdly, experiments conducted on the proposed adaptive time window matching strategy indicate that a higher exploration probability significantly improves resource matching efficiency. Given the uncertain supply and demand conditions during an epidemic, maintaining a high level of exploration within the matching time window is crucial for effective resource allocation. Additionally, in practical applications, health operations managers also need to determine accurate travel time in conjunction with navigation maps.</p>
<p>While the model presented effectively addresses the online matching problem of anti-epidemic resources, certain limitations necessitate further investigation. This study focuses solely on the impact of temporal factors on the allocation of epidemic prevention and control resources. However, other critical factors, such as resource supply capacity, the cross-regional distribution of resource shortages, population concentration, and spatial distribution, also require substantial research attention. Simultaneously, the issue of balancing efficiency and fairness in epidemic resource allocation is equally worthy of research consideration.</p></sec>
</body>
<back>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>ZW: Formal analysis, Project administration, Validation, Supervision, Data curation, Methodology, Visualization, Software, Writing &#x02013; review &#x00026; editing, Writing &#x02013; original draft, Resources, Investigation, Conceptualization. SP: Resources, Funding acquisition, Writing &#x02013; review &#x00026; editing, Formal analysis, Software, Writing &#x02013; original draft, Data curation, Conceptualization, Validation, Methodology, Visualization, Project administration, Supervision, Investigation. SH: Formal analysis, Resources, Visualization, Project administration, Writing &#x02013; review &#x00026; editing, Supervision, Conceptualization, Software, Methodology, Data curation, Investigation, Validation.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec><sec sec-type="supplementary-material" id="s12">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpubh.2025.1644499/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpubh.2025.1644499/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ma</surname> <given-names>J</given-names></name> <name><surname>Xu</surname> <given-names>J</given-names></name> <name><surname>Zhao</surname> <given-names>XL</given-names></name> <name><surname>Huo</surname> <given-names>SL</given-names></name> <name><surname>Duan</surname> <given-names>XL</given-names></name> <name><surname>Mu</surname> <given-names>YS</given-names></name> <etal/></person-group>. <article-title>Several major issues concerning the environmental transmission and risk prevention of SARS-CoV-2</article-title>. <source>Science China-Earth Sciences.</source> (<year>2022</year>) <volume>65</volume>:<fpage>1047</fpage>&#x02013;<lpage>56</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11430-021-9918-9</pub-id><pub-id pub-id-type="pmid">35578665</pub-id></mixed-citation>
</ref>
<ref id="B2">
<label>2.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fischer</surname> <given-names>GS</given-names></name> <name><surname>Righi</surname> <given-names>RDR</given-names></name> <name><surname>Ramos</surname> <given-names>GDO</given-names></name> <name><surname>da Costa</surname> <given-names>C</given-names></name> <name><surname>Rodrigues</surname> <given-names>JJPC</given-names></name></person-group>. <article-title>ElHealth: Using Internet of Things and data prediction for elastic management of human resources in smart hospitals</article-title>. <source>Eng Appl Artif Intell.</source> (<year>2020</year>) <volume>87</volume>:<fpage>103285</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.engappai.2019.103285</pub-id></mixed-citation>
</ref>
<ref id="B3">
<label>3.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shapley</surname> <given-names>L</given-names></name> <name><surname>Scarf</surname> <given-names>H</given-names></name></person-group>. <article-title>On cores and indivisibility</article-title>. <source>J Mathem Econ.</source> (<year>1974</year>) <volume>1</volume>:<fpage>23</fpage>&#x02013;<lpage>37</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0304-4068(74)90033-0</pub-id></mixed-citation>
</ref>
<ref id="B4">
<label>4.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shapley</surname> <given-names>LS</given-names></name> <name><surname>Shubik</surname> <given-names>M</given-names></name></person-group>. <article-title>The assignment game I: The core</article-title>. <source>Int J Game Theory.</source> (<year>1971</year>) <volume>1</volume>:<fpage>111</fpage>&#x02013;<lpage>30</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF01753437</pub-id></mixed-citation>
</ref>
<ref id="B5">
<label>5.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Roth</surname> <given-names>AE</given-names></name></person-group>. <article-title>Incentive compatibility in a market with indivisible goods</article-title>. <source>Econ Lett.</source> (<year>1982</year>) <volume>9</volume>:<fpage>127</fpage>&#x02013;<lpage>32</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0165-1765(82)90003-9</pub-id></mixed-citation>
</ref>
<ref id="B6">
<label>6.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Roth</surname> <given-names>AE</given-names></name></person-group>. <article-title>Marketplaces, markets, and market design</article-title>. <source>Am Econ Rev.</source> (<year>2018</year>) <volume>108</volume>:<fpage>1609</fpage>&#x02013;<lpage>58</lpage>. doi: <pub-id pub-id-type="doi">10.1257/aer.108.7.1609</pub-id><pub-id pub-id-type="pmid">30091861</pub-id></mixed-citation>
</ref>
<ref id="B7">
<label>7.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Roth</surname> <given-names>AE</given-names></name></person-group>. <article-title>The college admissions problem is not equivalent to the marriage problem</article-title>. <source>J Econ Theory.</source> (<year>1985</year>) <volume>36</volume>:<fpage>277</fpage>&#x02013;<lpage>88</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0022-0531(85)90106-1</pub-id></mixed-citation>
</ref>
<ref id="B8">
<label>8.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>Z</given-names></name> <name><surname>Tang</surname> <given-names>ZG</given-names></name> <name><surname>Wu</surname> <given-names>X</given-names></name> <name><surname>Zhang</surname> <given-names>Y</given-names></name></person-group>. <article-title>Online vertex-weighted bipartite matching: beating 1-1/e with random arrivals</article-title>. <source>ACM Trans Algorithms.</source> (<year>2019</year>) <volume>15</volume>:<fpage>38</fpage>. doi: <pub-id pub-id-type="doi">10.1145/3326169</pub-id></mixed-citation>
</ref>
<ref id="B9">
<label>9.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Torrico</surname> <given-names>A</given-names></name> <name><surname>Toriello</surname> <given-names>A</given-names></name></person-group>. <article-title>Dynamic relaxations for online bipartite matching</article-title>. <source>Informs J Comput.</source> (<year>2022</year>) <volume>34</volume>:<fpage>1871</fpage>&#x02013;<lpage>84</lpage>. doi: <pub-id pub-id-type="doi">10.1287/ijoc.2022.1168</pub-id></mixed-citation>
</ref>
<ref id="B10">
<label>10.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fahrbach</surname> <given-names>M</given-names></name> <name><surname>Zadimoghaddam</surname> <given-names>M</given-names></name> <name><surname>Huang</surname> <given-names>Z</given-names></name> <name><surname>Tao</surname> <given-names>R</given-names></name></person-group>. <article-title>Edge-weighted online bipartite matching</article-title>. <source>J ACM</source>. (<year>2022</year>) <volume>69</volume>:<fpage>45</fpage>. doi: <pub-id pub-id-type="doi">10.1145/3556971</pub-id></mixed-citation>
</ref>
<ref id="B11">
<label>11.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>W</given-names></name> <name><surname>Zheng</surname> <given-names>J</given-names></name> <name><surname>Yu</surname> <given-names>H</given-names></name> <name><surname>Chen</surname> <given-names>G</given-names></name> <name><surname>Chen</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>D</given-names></name></person-group>. <article-title>Online learning bipartite matching with non-stationary distributions</article-title>. <source>ACM Trans Knowl Discov Data.</source> (<year>2022</year>) <volume>16</volume>:<fpage>83</fpage>. doi: <pub-id pub-id-type="doi">10.1145/3502734</pub-id></mixed-citation>
</ref>
<ref id="B12">
<label>12.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Goyal</surname> <given-names>V</given-names></name> <name><surname>Udwani</surname> <given-names>R</given-names></name></person-group>. <article-title>Online matching with stochastic rewards: optimal competitive ratio via path-based formulation</article-title>. <source>Oper Res.</source> (<year>2023</year>) <volume>71</volume>:<fpage>563</fpage>&#x02013;<lpage>80</lpage>. doi: <pub-id pub-id-type="doi">10.1287/opre.2022.2345</pub-id></mixed-citation>
</ref>
<ref id="B13">
<label>13.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bai</surname> <given-names>G</given-names></name> <name><surname>Velamuri</surname> <given-names>SR</given-names></name></person-group>. <article-title>Contextualizing the sharing economy</article-title>. <source>J Managem Stud.</source> (<year>2021</year>) <volume>58</volume>:<fpage>977</fpage>&#x02013;<lpage>1001</lpage>. doi: <pub-id pub-id-type="doi">10.1111/joms.12652</pub-id></mixed-citation>
</ref>
<ref id="B14">
<label>14.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Slee</surname> <given-names>T</given-names></name></person-group>. <source>What&#x00027;s Yours Is Mine: Against the Sharing Economy</source>, New York, NY: OR Books. (<year>2017</year>).</mixed-citation>
</ref>
<ref id="B15">
<label>15.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>T</given-names></name></person-group>. <article-title>Trans-regional medical support in public health emergencies: a case study of Wuhan in the early COVID-19 pandemic in China</article-title>. <source>Risk Manag Healthc Policy.</source> (<year>2022</year>) <volume>15</volume>:<fpage>677</fpage>&#x02013;<lpage>83</lpage>. doi: <pub-id pub-id-type="doi">10.2147/RMHP.S346556</pub-id><pub-id pub-id-type="pmid">35449543</pub-id></mixed-citation>
</ref>
<ref id="B16">
<label>16.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nowzari</surname> <given-names>C</given-names></name> <name><surname>Preciado</surname> <given-names>VM</given-names></name> <name><surname>Pappas</surname> <given-names>GJ</given-names></name></person-group>. <article-title>Analysis and control of epidemics: a survey of spreading processes on complex networks</article-title>. <source>IEEE Control Syst Magaz.</source> (<year>2016</year>) <volume>36</volume>:<fpage>26</fpage>&#x02013;<lpage>46</lpage>. doi: <pub-id pub-id-type="doi">10.1109/MCS.2015.2495000</pub-id></mixed-citation>
</ref>
<ref id="B17">
<label>17.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>Z-Y</given-names></name> <name><surname>Sun</surname> <given-names>M</given-names></name> <name><surname>Han</surname> <given-names>X-X</given-names></name></person-group>. <article-title>Prediction-driven collaborative emergency medical resource allocation with deep learning and optimization</article-title>. <source>J Operat Res Soc</source>. (<year>2022</year>) <volume>74</volume>:<fpage>1</fpage>&#x02013;<lpage>14</lpage>. doi: <pub-id pub-id-type="doi">10.1080/01605682.2022.2101953</pub-id></mixed-citation>
</ref>
<ref id="B18">
<label>18.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pan</surname> <given-names>Y</given-names></name> <name><surname>Cheng</surname> <given-names>TCE</given-names></name> <name><surname>He</surname> <given-names>Y</given-names></name> <name><surname>Ng</surname> <given-names>CT</given-names></name> <name><surname>Sethi</surname> <given-names>SP</given-names></name></person-group>. <article-title>Foresighted medical resources allocation during an epidemic outbreak</article-title>. <source>Transport Res Part E: Logist Transport Rev.</source> (<year>2022</year>) <volume>164</volume>:<fpage>102762</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tre.2022.102762</pub-id></mixed-citation>
</ref>
<ref id="B19">
<label>19.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Long</surname> <given-names>EF</given-names></name> <name><surname>Nohdurft</surname> <given-names>E</given-names></name> <name><surname>Spinler</surname> <given-names>S</given-names></name></person-group>. <article-title>Spatial resource allocation for emerging epidemics: a comparison of greedy, myopic, and dynamic policies</article-title>. <source>Manufact Serv Operat Managem.</source> (<year>2018</year>) <volume>20</volume>:<fpage>181</fpage>&#x02013;<lpage>98</lpage>. doi: <pub-id pub-id-type="doi">10.1287/msom.2017.0681</pub-id></mixed-citation>
</ref>
<ref id="B20">
<label>20.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pei</surname> <given-names>Z</given-names></name> <name><surname>Yuan</surname> <given-names>Y</given-names></name> <name><surname>Yu</surname> <given-names>T</given-names></name> <name><surname>Li</surname> <given-names>N</given-names></name></person-group>. <article-title>Dynamic allocation of medical resources during the outbreak of epidemics</article-title>. <source>IEEE Trans Automat Sci Eng.</source> (<year>2022</year>) <volume>19</volume>:<fpage>663</fpage>&#x02013;<lpage>76</lpage>. doi: <pub-id pub-id-type="doi">10.1109/TASE.2021.3102491</pub-id></mixed-citation>
</ref>
<ref id="B21">
<label>21.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname> <given-names>X</given-names></name> <name><surname>Liu</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>S</given-names></name> <name><surname>Wang</surname> <given-names>R</given-names></name> <name><surname>Chen</surname> <given-names>X</given-names></name> <name><surname>Wang</surname> <given-names>W</given-names></name></person-group>. <article-title>Allocating resources for epidemic spreading on metapopulation networks</article-title>. <source>Appl Math Comput.</source> (<year>2021</year>) <volume>411</volume>:<fpage>126531</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.amc.2021.126531</pub-id></mixed-citation>
</ref>
<ref id="B22">
<label>22.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Enayati</surname> <given-names>S</given-names></name> <name><surname>&#x000D6;zaltin</surname> <given-names>OY</given-names></name></person-group>. <article-title>Optimal influenza vaccine distribution with equity</article-title>. <source>Eur J Oper Res.</source> (<year>2020</year>) <volume>283</volume>:<fpage>714</fpage>&#x02013;<lpage>25</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ejor.2019.11.025</pub-id></mixed-citation>
</ref>
<ref id="B23">
<label>23.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>XW</given-names></name> <name><surname>Chong</surname> <given-names>WF</given-names></name> <name><surname>Feng</surname> <given-names>RH</given-names></name> <name><surname>Zhang</surname> <given-names>LF</given-names></name></person-group>. <article-title>Pandemic risk management: resources contingency planning and allocation</article-title>. <source>Insurance Mathem Econ.</source> (<year>2021</year>) <volume>101</volume>:<fpage>359</fpage>&#x02013;<lpage>83</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.insmatheco.2021.08.001</pub-id><pub-id pub-id-type="pmid">34803199</pub-id></mixed-citation>
</ref>
<ref id="B24">
<label>24.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gatouillat</surname> <given-names>A</given-names></name> <name><surname>Badr</surname> <given-names>Y</given-names></name> <name><surname>Massot</surname> <given-names>B</given-names></name> <name><surname>Sejdi&#x00107;</surname> <given-names>E</given-names></name></person-group>. <article-title>Internet of medical things: a review of recent contributions dealing with cyber-physical systems in medicine</article-title>. <source>IEEE Intern Things J.</source> (<year>2018</year>) <volume>5</volume>:<fpage>3810</fpage>&#x02013;<lpage>22</lpage>. doi: <pub-id pub-id-type="doi">10.1109/JIOT.2018.2849014</pub-id></mixed-citation>
</ref>
<ref id="B25">
<label>25.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ashlagi</surname> <given-names>I</given-names></name> <name><surname>Nikzad</surname></name> <name><surname>A</surname></name> <name><surname>Strack</surname> <given-names>P</given-names></name></person-group>. <article-title>Matching in dynamic imbalanced markets</article-title>. <source>Rev Econ Stud</source>. (<year>2022</year>) <volume>90</volume>:<fpage>1084</fpage>&#x02013;<lpage>24</lpage>. doi: <pub-id pub-id-type="doi">10.1093/restud/rdac044</pub-id></mixed-citation>
</ref>
<ref id="B26">
<label>26.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Sutton</surname> <given-names>RS</given-names></name> <name><surname>Barto</surname> <given-names>AG</given-names></name></person-group>. <source>Reinforcement Learning: An Introduction</source>. <publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>The MIT Press</publisher-name>. (<year>2018</year>).</mixed-citation>
</ref>
<ref id="B27">
<label>27.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bouneffouf</surname> <given-names>D</given-names></name> <name><surname>Rish</surname> <given-names>I</given-names></name></person-group>. <article-title>A survey on practical applications of multi-armed and contextual bandits</article-title>. <source>arXiv</source> [preprint] arXiv:1904.10040. (<year>2019</year>). doi: <pub-id pub-id-type="doi">10.48550/arXiv.1904.10040</pub-id></mixed-citation>
</ref>
<ref id="B28">
<label>28.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sutton</surname> <given-names>RS</given-names></name></person-group>. <article-title>Learning to predict by the methods of temporal differences</article-title>. <source>Mach Learn.</source> (<year>1988</year>) <volume>3</volume>:<fpage>9</fpage>&#x02013;<lpage>44</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF00115009</pub-id></mixed-citation>
</ref>
<ref id="B29">
<label>29.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>L</given-names></name> <name><surname>Littman</surname> <given-names>ML</given-names></name> <name><surname>Mansley</surname> <given-names>CR</given-names></name></person-group>. <article-title>Online exploration in least-squares policy iteration</article-title>. In: <source>AAMAS &#x00027;09.</source> <publisher-loc>Richland, SC</publisher-loc>: <publisher-name>International Foundation for Autonomous Agents and Multiagent Systems</publisher-name> (<year>2009</year>). p. <fpage>733</fpage>&#x02013;<lpage>9</lpage>.</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1395648/overview">Paolo Di Giamberardino</ext-link>, Sapienza University of Rome, Italy</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1762307/overview">Zongliang Wen</ext-link>, Xuzhou Medical University, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3149067/overview">Thattapon Surasak</ext-link>, King Mongkut&#x00027;s University of Technology North Bangkok, Thailand</p>
</fn>
</fn-group>
</back>
</article>