<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Neurorobot.</journal-id>
<journal-title>Frontiers in Neurorobotics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Neurorobot.</abbrev-journal-title>
<issn pub-type="epub">1662-5218</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fnbot.2024.1355857</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Neuroscience</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>YOLOv8-ACU: improved YOLOv8-pose for facial acupoint detection</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Yuan</surname> <given-names>Zijian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2603780/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Shao</surname> <given-names>Pengwei</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Jinran</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2615169/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Yinuo</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhu</surname> <given-names>Zixuan</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Qiu</surname> <given-names>Weijie</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Buqun</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Tang</surname> <given-names>Yan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Han</surname> <given-names>Aiqing</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1540324/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>College of Management, Beijing University of Chinese Medicine</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Beijing No.80 High School, International Department</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>College of Acupuncture and Massage, Beijing University of Chinese Medicine</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Xianmin Wang, Guangzhou University, China</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Ningbo Yu, Nankai University, China</p>
<p>Bo Jin, University of Coimbra, Portugal</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Yan Tang <email>tangyan97_1017&#x00040;sina.com</email></corresp>
<corresp id="c002">Aiqing Han <email>aqhan&#x00040;hotmail.com</email></corresp>
<fn fn-type="equal" id="fn001"><p>&#x02020;These authors have contributed equally to this work and share first authorship</p></fn></author-notes>
<pub-date pub-type="epub">
<day>01</day>
<month>02</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>18</volume>
<elocation-id>1355857</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>12</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>17</day>
<month>01</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2024 Yuan, Shao, Li, Wang, Zhu, Qiu, Chen, Tang and Han.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Yuan, Shao, Li, Wang, Zhu, Qiu, Chen, Tang and Han</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Acupoint localization is integral to Traditional Chinese Medicine (TCM) acupuncture diagnosis and treatment. Employing intelligent detection models for recognizing facial acupoints can substantially enhance localization accuracy.</p></sec>
<sec>
<title>Methods</title>
<p>This study introduces an advancement in the YOLOv8-pose keypoint detection algorithm, tailored for facial acupoints, and named YOLOv8-ACU. This model enhances acupoint feature extraction by integrating ECA attention, replaces the original neck module with a lighter Slim-neck module, and adopts GIoU as the loss function.</p></sec>
<sec>
<title>Results</title>
<p>The YOLOv8-ACU model achieves impressive accuracy, with an mAP&#x00040;0.5 of 97.5% and an mAP&#x00040;0.5&#x02013;0.95 of 76.9% on our self-constructed datasets. It also marks a reduction in model parameters by 0.44M, model size by 0.82 MB, and GFLOPs by 9.3%.</p></sec>
<sec>
<title>Discussion</title>
<p>With its enhanced recognition accuracy and efficiency, along with good generalization ability, YOLOv8-ACU provides significant reference value for facial acupoint localization and detection. This is particularly beneficial for Chinese medicine practitioners engaged in facial acupoint research and intelligent detection.</p></sec></abstract>
<kwd-group>
<kwd>Chinese medicine acupoints</kwd>
<kwd>YOLOv8-pose</kwd>
<kwd>keypoint detection</kwd>
<kwd>ECA-net</kwd>
<kwd>slim-neck</kwd>
<kwd>GIoU</kwd>
</kwd-group>
<counts>
<fig-count count="10"/>
<table-count count="4"/>
<equation-count count="8"/>
<ref-count count="47"/>
<page-count count="15"/>
<word-count count="8603"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Since the 1970s, WHO has been actively promoting acupuncture to the world, setting up acupuncture training institutions in many countries, supporting the creation of the World Federation of Acupuncture Societies (WFA), announcing many times the appropriate conditions for acupuncture treatment, encouraging global patients to choose acupuncture therapy, and striving to promote the internationalization and standardization of acupuncture (Lim, <xref ref-type="bibr" rid="B20">2010</xref>). Acupuncture and massage are important parts of Chinese medicine, which is based on the theory of Chinese medicine&#x00027;s internal organs and meridians, with acupuncture and massage as the main treatment, and is an important means used to prevent and treat diseases and eliminate fatigue. By stimulating specific points on the human body, acupuncture and massage can regulate the body&#x00027;s qi and blood circulation and the balance of yin and yang, so as to achieve the purpose of treating diseases and relieving fatigue. Acupuncture and massage have been widely used in clinical practice and are gradually gaining attention and recognition worldwide. Acupoint localization serves as a pivotal component in the modalities of acupuncture and tuina therapy, where its precision holds a direct correlation with the resultant therapeutic efficacy (Zheng, <xref ref-type="bibr" rid="B44">2022</xref>). The imprecision in acupoint targeting may culminate in the ineffectuality of acupuncture interventions, potentially precipitating severe repercussions including, but not limited to, localized trauma, neural impairment, aneurysmal formations, ocular injuries, and incidences of needle fracture (Godson and Wardle, <xref ref-type="bibr" rid="B10">2019</xref>). 
Pertaining to the human facial region, which is characterized by a plethora of acupoints each with distinct functionalities and in close proximity to one another, the task of exact acupoint identification is further complicated owing to the inter-individual anatomical variability, thereby presenting substantial challenges in accurate acupoint delineation (Lee et al., <xref ref-type="bibr" rid="B17">2020</xref>). In clinical practice, the commonly used methods of taking acupoints can be divided into the method of anatomical marking on the body surface, the method of bone measurement and the method of body measurement (Zheng et al., <xref ref-type="bibr" rid="B46">2005</xref>; Lin and Yi, <xref ref-type="bibr" rid="B21">2019</xref>), all of which are artificial positioning of acupoints from the visual level, and the degree of accuracy is highly dependent on the professional skills and experience of physicians. Due to the complexity of human anatomy and individual differences, artificial positioning methods inevitably have certain subjectivity and errors, which affect the accuracy of acupoint positioning. Therefore, it is necessary to develop a new method to improve the objectivity, efficiency and accuracy of acupoint positioning to assist practitioners in prevention and treatment.</p>
<p>Artificial intelligence techniques may help to build intelligent, efficient and accurate models for acupoint detection and localization. In recent years, AI techniques have been widely used in the fields of human behavior recognition, facial feature recognition and keypoint detection (Berretti et al., <xref ref-type="bibr" rid="B1">2011</xref>; Maji et al., <xref ref-type="bibr" rid="B25">2022</xref>; Pranavan et al., <xref ref-type="bibr" rid="B28">2023</xref>; Zhang et al., <xref ref-type="bibr" rid="B43">2023</xref>). However, as the available research deepens, the existing acupoint detection models have problems such as over-reliance on external devices such as infrared, insufficient mining of feature representations, and low accuracy and robustness of acupoint detection (Zhang et al., <xref ref-type="bibr" rid="B43">2023</xref>). These issues seriously affect the generality of the models, and researchers are gradually recognizing the advantages of high-precision, lightweight detection models, which migrate more easily to mobile or embedded devices while achieving performance comparable to that of larger models.</p>
<p>Due to the problems of oversized models, low accuracy and insufficient robustness in existing studies, this study innovatively adopts the YOLOv8-ACU algorithm for facial acupoint recognition. Since acupoints do not have clear physical features or geometric shapes on the human surface, and locating facial acupoints by Chinese medicine practitioners is actually a process of locating facial regions or points, this study combines the facial acupoint detection task with face keypoint detection, and divides the task of facial acupoint detection into two aspects: identification of the type of acupoints and localization of the acupoints. Deep learning and computer vision techniques are used to recognize human facial features and acupoint location features, so as to achieve intelligent acupoint detection and assist doctors in acupoint treatment. The main contributions of this research are summarized as follows:</p>
<list list-type="simple">
<list-item><p>(1) The YOLOv8-pose model is applied to the self-constructed facial acupoints dataset and it has the advantages of high efficiency, speed, and accuracy compared with other models.</p></list-item>
<list-item><p>(2) The ECA channel attention mechanism is used to reduce the extraction of features outside the face, allowing the model to focus more on the extraction of facial acupoint features.</p></list-item>
<list-item><p>(3) Replacing the original neck module in YOLOv8-pose with Slim-neck can improve the recognition accuracy while making the model more lightweight.</p></list-item>
<list-item><p>(4) Replacing the loss function can more effectively improve the recognition effect and convergence speed of the model.</p></list-item>
</list>
<p>The algorithm used in this research has the advantages of high efficiency, multi-task processing, high accuracy, and robustness improvement, which better meets the needs of keypoint detection of facial acupoints. It possesses extremely important practical significance and clinical application potential. The specific implementation tools utilized in this algorithm are illustrated in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Implementing tools.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Parameter</bold></th>
<th valign="top" align="left"><bold>Type</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">CPU</td>
<td valign="top" align="left">Intel(R) Core(TM) i9&#x02013;11900H</td>
</tr>
<tr>
<td valign="top" align="left">Memory (GB)</td>
<td valign="top" align="left">16G</td>
</tr>
<tr>
<td valign="top" align="left">GPU</td>
<td valign="top" align="left">NVIDIA GeForce RTX 3060</td>
</tr>
<tr>
<td valign="top" align="left">Graphics Memory (GB)</td>
<td valign="top" align="left">6G</td>
</tr>
<tr>
<td valign="top" align="left">Training environment</td>
<td valign="top" align="left">CUDA 11.8 CUDNN 8.7</td>
</tr>
<tr>
<td valign="top" align="left">Operating system</td>
<td valign="top" align="left">Windows 11 (64-bit)</td>
</tr>
<tr>
<td valign="top" align="left">Development environment (computer)</td>
<td valign="top" align="left">Python3.10.11 Pytorch2.0.0</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec id="s2">
<title>Related works</title>
<p>In recent years, facial image processing, as a pivotal technology, has propelled technological advancements in domains such as facial recognition and image analysis. Deng et al. (<xref ref-type="bibr" rid="B6">2019</xref>) introduced a novel loss function, ArcFace, aimed at enhancing the capability of deep convolutional neural networks in feature learning. This innovation not only optimized the efficiency of feature extraction but also laid a foundational framework for the subsequent evolution of facial image processing technologies. Utilizing the efficient feature extraction methodology of ArcFace, Jin et al. (<xref ref-type="bibr" rid="B15">2022</xref>) applied deep learning models, originally developed for facial recognition tasks, to facial diagnostics. This cross-disciplinary application underscores the versatility and generalizability of deep learning models, offering new perspectives for medical image analysis and diagnostics. To further advance facial image processing, innovative techniques such as the generation of pseudo-depth information from traditional 2D RGB images using Generative Adversarial Networks (GANs) have been proposed (Jin et al., <xref ref-type="bibr" rid="B14">2020</xref>). These advancements not only enhance the accuracy of facial recognition but also enable more complex facial recognition capabilities in resource-constrained settings. Concurrent with the rapid development of facial image processing, facial keypoint detection has emerged as a research focus, categorically divided into traditional facial keypoint detection methods and those based on deep learning. Among them, the traditional methods require manual design, feature extraction, and construction of subsequent classification or regression models, which can be further divided into parametric shape model-based methods and cascade shape regression-based methods. 
Among them, two representative algorithms based on the parametric shape model approach are the Active Shape Model (ASM) (Cootes et al., <xref ref-type="bibr" rid="B5">1995</xref>) and Active Appearance Models (AAM) (Cootes et al., <xref ref-type="bibr" rid="B4">1998</xref>). ASM is a face keypoint detection algorithm proposed by Cootes et al. (<xref ref-type="bibr" rid="B5">1995</xref>). It is a point distribution model-based algorithm that first obtains the training set by manual calibration, then obtains the shape model after training, abstracts the target object through the shape model, and finally achieves face shape matching through keypoint matching in the testing stage. Cootes et al. (<xref ref-type="bibr" rid="B4">1998</xref>) further improved the ASM algorithm and obtained the AAM algorithm, which takes the texture features of the face region into account while adopting the shape constraints, establishes the texture model while building the shape model, and combines the two models to obtain the active appearance model. Doll&#x000E1;r et al. (<xref ref-type="bibr" rid="B8">2010</xref>) put forward a classic work called Cascaded Pose Regression (CPR), which is a method for matching the shape of the face. The CPR model adopts a multi-stage, coarse-to-fine cascade learning idea to gradually improve the accuracy of keypoint locations through multiple iterations. This idea still influences many deep learning-based computer vision algorithms, such as Convolutional Pose Machines (CPM) (Wei et al., <xref ref-type="bibr" rid="B38">2016</xref>) and Stacked Hourglass Network (Newell et al., <xref ref-type="bibr" rid="B26">2016</xref>) in the field of human pose estimation, and Cascaded R-CNN (Cai and Vasconcelos, <xref ref-type="bibr" rid="B2">2018</xref>) in target detection. 
Although the above traditional methods based on face keypoint detection can achieve better detection results to a certain extent, they inevitably have the limitations of complex data processing, poor anti-interference ability and low computational efficiency.</p>
<p>To overcome these problems, deep learning-based face keypoint detection methods have emerged in recent years and have substantially outperformed traditional methods in face keypoint detection tasks. Sun et al. (<xref ref-type="bibr" rid="B35">2013</xref>) first proposed and employed a deep convolutional neural network, DCNN (Deep convolutional network) (Ren et al., <xref ref-type="bibr" rid="B31">2017</xref>), for face keypoint detection, proposing a three-stage coarse-to-fine cascade regression network, which achieved then-optimal results on several publicly available datasets. Currently, some scholars have applied deep learning-based keypoint detection techniques to face acupoint detection, and Zhang et al. (<xref ref-type="bibr" rid="B43">2023</xref>) constructed the face point dataset FAcupoint and proposed the FADbR facial point detection algorithm framework, which adequately extracts face features through the reconstruction task and reduces the model&#x00027;s dependence on labeled data. Berretti et al. (<xref ref-type="bibr" rid="B1">2011</xref>) conducted experiments on the BU-3DFE dataset to extract the local features of the face using the SIFT (Lowe, <xref ref-type="bibr" rid="B24">2004</xref>) model for keypoint detection and used a multi-class SVM (Platt, <xref ref-type="bibr" rid="B27">1998</xref>) for classification, and the experimental results showed that the method has a good performance in recognizing facial expressions. YOLO series algorithms, which use a one-stage detection method, have many applications in keypoint detection by virtue of their simple network model and high accuracy rate. Maji et al. (<xref ref-type="bibr" rid="B25">2022</xref>) proposed the YOLO-pose algorithm for 2D multi-person pose keypoint estimation in images, achieving impressive results. On the MS COCO validation and test sets, the model achieved mAP&#x00040;0.5 values of 90.2% and 90.3%, respectively. Pranavan et al. 
(<xref ref-type="bibr" rid="B28">2023</xref>) applied YOLOv7-pose to keypoint detection for assessing falls in elderly individuals, achieving an accuracy of 89.6% and precision of 91.2%, demonstrating good detection performance. However, the aforementioned models still have drawbacks such as slow speed, poor performance in detecting small faces, difficulties in training, and relatively low model accuracy. Therefore, this research proposes three improvements to the original YOLOv8-pose model, aiming to both reduce model size and enhance the accuracy of acupoint recognition.</p>
<p>ECA-net (Wang et al., <xref ref-type="bibr" rid="B37">2020</xref>) is an improvement upon SE-net (Hu et al., <xref ref-type="bibr" rid="B12">2018</xref>), introducing a local cross-channel interaction strategy without dimensionality reduction. This strategy is implemented efficiently via one-dimensional convolution, with ResNets (He et al., <xref ref-type="bibr" rid="B11">2016</xref>) and MobileNetV2 (Sandler et al., <xref ref-type="bibr" rid="B34">2018</xref>) employed as backbones. The proposed ECA module has been extensively evaluated in image classification, object detection, and instance segmentation. Experimental results demonstrate that the module outperforms other modules in terms of performance while maintaining high efficiency. In this research, the ECA attention mechanism is employed to enhance the capture of acupoint features, with a focus on improving these features.</p>
<p>Slim-neck (Li et al., <xref ref-type="bibr" rid="B19">2022</xref>) is used to balance model accuracy and speed. Originally applied to the SODA10M autonomous driving dataset, the Slim-neck detector shows significant improvements in speed and accuracy compared to the original detector. In this work, the Slim-neck module is substituted for the original neck module, enabling lightweight modeling while maintaining good detection performance.</p>
<p>GIoU (Rezatofighi et al., <xref ref-type="bibr" rid="B33">2019</xref>) is an improvement upon IoU (Yu et al., <xref ref-type="bibr" rid="B41">2016</xref>) and is utilized to optimize the non-overlapping regions. It has been verified that replacing IoU with GIoU significantly improves detection accuracy and is applicable to YOLO (Redmon et al., <xref ref-type="bibr" rid="B30">2016</xref>) algorithms and the Faster R-CNN (Ren et al., <xref ref-type="bibr" rid="B32">2015</xref>) series. In this research, GIoU is used as a loss function to enhance facial object detection capability and facial acupoint keypoint detection.</p>
</sec>
<sec id="s3">
<title>Material and methods</title>
<p>This section firstly introduces the improvement process of YOLOv8-pose, and then gives a brief introduction to the YOLOv8 keypoint detection algorithm in subsection 3.1, explaining the role and structure of each module. In subsection 3.2, it focuses on the improvement strategy of this research and gives a detailed description of each improved module in subsections 3.2.1, 3.2.2, and 3.2.3.</p>
<p>The YOLOv8-ACU keypoint detection model and the improved experimental flow proposed in this research are shown in <xref ref-type="fig" rid="F1">Figure 1</xref>, including the following ten steps.</p>
<list list-type="bullet">
<list-item><p>Step 1: Select 608 frontal face photos from the WIDER Face public dataset as the dataset for this experiment.</p></list-item>
<list-item><p>Step 2: Use labelme software to manually label 11 types of acupoints.</p></list-item>
<list-item><p>Step 3: Divide the dataset into training and validation sets.</p></list-item>
<list-item><p>Step 4: Create an initial YOLOv8-pose model for subsequent improvement.</p></list-item>
<list-item><p>Step 5: YOLOv8-ACU model
<list list-type="simple">
<list-item><p>- Sub-step 5.1: Add ECA attention mechanism to the backbone part of the original model.</p></list-item>
<list-item><p>- Sub-step 5.2: Replace the original model&#x00027;s neck module with a lighter weight Slim-neck.</p></list-item>
<list-item><p>- Sub-step 5.3: Change the loss function to GIoU.</p></list-item>
</list></p></list-item>
<list-item><p>Step 6: Fine-tune the original parameters in the model and train the data using YOLOv8-ACU.</p></list-item>
<list-item><p>Step 7: Save the optimal model generated by the training process and evaluate the model performance on the validation set.</p></list-item>
<list-item><p>Step 8: Collect additional facial image data as an external test set to complete the data labeling.</p></list-item>
<list-item><p>Step 9: Apply external test set for model performance evaluation and the results are given in subsection 4.5.3.</p></list-item>
<list-item><p>Step 10: Compare the evaluation results of the original model and the improved model detection, and output the model evaluation results.</p></list-item>
</list>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>Experimental steps of keypoint detection model for acupoints.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0001.tif"/>
</fig>
<sec>
<title>YOLOv8 keypoint detection algorithm</title>
<p>YOLOv8 (Jocher et al., <xref ref-type="bibr" rid="B16">2020</xref>) is the latest detection algorithm introduced in the current YOLO series of algorithms, which is suitable for tasks such as target detection, image classification and instance segmentation. In this research, we focus on keypoint detection, and choose the smaller but more accurate YOLOv8n as the base model. The detection network of YOLOv8n is divided into four parts: Input, Backbone, Neck, and Head.</p>
<p><italic>Input:</italic> This part is responsible for scaling the input image to the size needed for training, and carrying out data preprocessing and enhancement operations. Preprocessing includes normalization and scaling of images, ensuring consistency in the input size and pixel value range. For data enhancement, techniques such as scaling, tone adjustment, Mosaic augmentation, and random transformations like cropping, rotating, and flipping are employed. The anchor-free mechanism is also adopted here to predict the center of the object directly, reducing the complexity and dependence on predefined anchor sizes and shapes.</p>
<p><italic>Backbone:</italic> The backbone is used for feature extraction and contains Conv, C2f and SPPF modules. The new C2f structure applies residual features for learning, which enriches the gradient flow information; SPPF (Spatial Pyramid Pooling-Fast) converts an arbitrarily sized feature map into a fixed-size feature vector.</p>
<p><italic>Neck:</italic> The structure of the neck follows the Feature Pyramid Network (FPN) (Lin et al., <xref ref-type="bibr" rid="B22">2017</xref>) and the Path Aggregation Network (PAN) (Liu et al., <xref ref-type="bibr" rid="B23">2018</xref>), effectively integrating the top-down and bottom-up information flow in the network and enhancing the detection performance.</p>
<p><italic>Head:</italic> The head section utilizes different-sized feature maps to obtain category and position information for objects of varying sizes. It applies the concept of Distributional Focal Loss (DFL) (Qian et al., <xref ref-type="bibr" rid="B29">2020</xref>), reducing the parameter size and computational complexity. The YOLOv8 series of models perform well in terms of detection accuracy and speed, and in this research, YOLOv8n is used as the basis for improvement to further enhance the detection performance.</p>
</sec>
<sec>
<title>YOLOv8-ACU facial acupoint detection algorithm</title>
<p>The initial model of YOLOv8-pose is a keypoint detection model for human posture recognition. Since there are some differences in features between facial acupoint keypoint detection and human posture keypoint detection, and the detection of facial acupoints requires higher accuracy, this research improves the original YOLOv8-pose model, aiming to make it have the potential for clinical applications in the future. Because the distribution of facial acupoints is relatively dense, an effective ECA attention mechanism needs to be introduced into the feature extraction network of the backbone to enhance the feature representation capability and focus more attention on each acupoint, and the ECA attention mechanism is able to reduce the redundant computation while fully considering the global information, thus improving the performance and robustness of the model. Adopting Slim-neck instead of the original neck structure, by fusing the features of different layers, the network&#x00027;s ability to detect objects of different scales can be effectively improved, so as to reduce the detection error of the acupoints due to the change of the object&#x00027;s scale, and the Slim-neck can reduce the computational complexity of the model while improving the model&#x00027;s accuracy. Meanwhile, during the experiment, the loss function is further modified to use GIoU as the loss function. Its network structure is shown in <xref ref-type="fig" rid="F2">Figure 2</xref>.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>YOLOv8-ACU model structure.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0002.tif"/>
</fig>
<sec>
<title>ECA attention mechanism</title>
<p>The main idea behind attention mechanisms is &#x0201C;dynamic weighting,&#x0201D; which assigns higher weights to important information and lower weights to relatively irrelevant information (Deng et al., <xref ref-type="bibr" rid="B7">2023</xref>). As a new and efficient channel attention mechanism, the ECA attention mechanism mainly improves the SE attention mechanism, and achieves performance improvement through the local cross-channel interaction strategy without dimensionality reduction and adaptive selection of one-dimensional convolutional kernel size. Its specific steps are as follows:</p>
<list list-type="bullet">
<list-item><p>Step 1: Perform global average pooling operation on the input feature map.</p></list-item>
<list-item><p>Step 2: Conduct a 1D convolution operation with a kernel size of k, followed by a Sigmoid (Elfwing et al., <xref ref-type="bibr" rid="B9">2018</xref>) activation function to obtain weights w for each channel.</p></list-item>
<list-item><p>Step 3: The weights are multiplied with the corresponding elements of the original input feature map to obtain the final output features.</p></list-item>
</list>
<p>Incorporating the ECA attention mechanism into the backbone structure of YOLOv8-pose enables the neural network to pay more attention to the feature acquisition of acupoint locations and reduce the acquisition of other information beyond the face. Its flowchart is shown in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Flowchart of the ECA attention mechanism.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0003.tif"/>
</fig>
</sec>
<sec>
<title>Slim-neck module</title>
<p>In order to accelerate the computation of the prediction, the input images in the convolutional neural network almost always need to undergo the following transformation process: the spatial information is gradually transferred to the channels, and each time the spatial (width and height) compression of the feature maps and the expansion of the channels lead to a partial loss of the semantic information, which makes the feature extraction for the acupuncture point recognition incomplete. Therefore, in this research, Slim-neck module is introduced to replace the original neck module in YOLOv8-pose in order to preserve as many hidden connections of each channel as possible.</p>
<p>Firstly, the traditional convolutional Conv is replaced in Slim-neck with the lightweight GSConv, a convolutional operation based on global pooling and group sparse concatenation, which improves the expressive power of the model while reducing the amount of computation by dividing the input channels into groups and performing independent convolutional operations on each group. The GSbottleneck module and VoV-GSCSP module are introduced on the basis of GSConv. The structure of VoV-GSCSP is shown in <xref ref-type="fig" rid="F4">Figure 4</xref>. Among them, the VoV-GSCSP module uses the one-time aggregation method to design the cross-level partial network, and replaces the CSP module in the original neck with it, which reduces the amount of model computation and reduces the complexity of the network structure while maintaining sufficient accuracy. Slim-neck realizes the reconstruction of the neck module of YOLOv8-pose by combining GSConv and VoV-GSCSP, which is more conducive to the extraction and categorization of acupoint features, and also improves the accuracy of acupoint recognition while reducing the amount of model computation.</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>Structure of VoV-GSCSP.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0004.tif"/>
</fig>
</sec>
<sec>
<title>Improvement of the loss function</title>
<p>YOLOv8-pose fuses the target detection task and keypoint detection task together, so the accuracy of keypoint detection also depends on the accuracy of target detection to some extent. This research therefore uses the GIoU loss function to replace the CIoU loss function on the target detection task (Zheng et al., <xref ref-type="bibr" rid="B47">2020</xref>). The GIoU loss function, as an improved form of IoU, focuses not only on the overlapping region of the detection frames, but also on the non-overlapping regions, which better reflects the degree of overlap between the predicted frame and the ground-truth frame. The formula for GIoU calculation is as follows:</p>
<disp-formula id="E1"><label>(1)</label><mml:math id="M1"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>G</mml:mi><mml:mi>I</mml:mi><mml:mi>o</mml:mi><mml:mi>U</mml:mi><mml:mo>=</mml:mo><mml:mi>I</mml:mi><mml:mi>o</mml:mi><mml:mi>U</mml:mi><mml:mo>-</mml:mo><mml:mfrac><mml:mrow><mml:mi>C</mml:mi><mml:mo>-</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>B</mml:mi><mml:mo>&#x0222A;</mml:mo><mml:msup><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mi>g</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mi>C</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where C is the area of the minimum circumscribed rectangle enclosing both frames, B is the target prediction frame, and <italic>B</italic><sup><italic>gt</italic></sup> is the ground-truth frame, according to Equation <xref ref-type="disp-formula" rid="E1">(1)</xref>.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="s4">
<title>Results</title>
<sec>
<title>Facial acupuncture point detection dataset</title>
<p>In the research, experiments are conducted using Class I dataset and Class II dataset, where Class I dataset is used for training and validation of the model, while Class II dataset is used for testing of the model to evaluate and test the generalization ability of the model.</p>
<p><italic>Class I dataset:</italic> The Class I dataset is constructed based on the publicly available WIDER Face dataset (Yang et al., <xref ref-type="bibr" rid="B40">2016</xref>), selecting 608 images with frontal faces and limited occlusions for labeling 11 types of facial acupoints. To ensure the accuracy of annotation, three acupuncturists, each with over 20 years of extensive clinical experience and who have undergone regular training and updates, were invited to locate acupoints based on the International Standards of Acupuncture Points published by the WHO (World Health Organization Regional Office for the Western Pacific, <xref ref-type="bibr" rid="B39">2008</xref>). In cases of disagreement, the principle of the minority conforming to the majority was adopted. If opinions were completely divergent, a consensus was reached through case study analysis and literature review discussions before proceeding with the localization. This process ultimately led to the formation of a Class I self-constructed dataset, Acupoint-I. During model training, the Acupoint-I dataset was divided into training and validation sets using an 8:2 ratio.</p>
<p><italic>Class II dataset:</italic> The Class II dataset is an external dataset utilized by our team specifically for model testing. It consists of 236 frontal face photographs of diverse individuals, sourced both from the internet and the SCUT-FBP5500 public dataset. This dataset encompasses a balanced representation of adult males and females from both Asian and Caucasian ethnicities, with a deliberate 1:1 gender ratio maintained in the selection process. These images were annotated with acupoints by the three acupuncturists mentioned earlier, using the same methodology as that for the Class I dataset, leading to the formation of the self-constructed Class II dataset, Acupoint-II. Distinct from the model&#x00027;s training phase, the Class II dataset is exclusively deployed during the model evaluation stage. Its primary role is to accurately assess the model&#x00027;s generalization capabilities over unseen data and is not involved in the training process, ensuring no potential influence on the model&#x00027;s performance.</p>
<p><italic>Introduction to acupuncture points:</italic> Worldwide, acupuncture has become an indispensable part of daily medical practice and is now a widely used therapeutic modality in medicine (Chon and Lee, <xref ref-type="bibr" rid="B3">2013</xref>). Following the guidance of the principle of syndrome differentiation and treatment, the selection of appropriate acupoints and their compatibility is a prerequisite for acupuncture treatment and a strong guarantee for improving clinical efficacy (Tian, <xref ref-type="bibr" rid="B36">2010</xref>). Based on the experiences of Yu et al. (<xref ref-type="bibr" rid="B42">2021</xref>) and Zheng et al. (<xref ref-type="bibr" rid="B45">2009</xref>) in selecting acupoints for the treatment of peripheral facial paralysis, we finally selected Zanzhu (ST2), Sibai (ST7), Xiaguan (BL2), Dicang (ST4), Taiyang (EX-HN4), and Quanliu (SI18) as main acupoints and Yuyao (EX-HN5), Yingxiang (LI20), Kouheliao (LI19), Jiachengjiang (ST6), and Jiache (EX-HN19) as complementary acupoints. The medical positioning of these 11 acupoints is as follows (as shown in <xref ref-type="fig" rid="F5">Figure 5</xref>), according to the International Organisation for Standardization (<xref ref-type="bibr" rid="B13">2021</xref>):</p>
<list list-type="bullet">
<list-item><p><italic>Xiaguan (BL2):</italic> Located in the depression between the central part of the lower edge of the zygomatic arch and the infraorbital margin.</p></list-item>
<list-item><p><italic>Taiyang (EX-HN4):</italic> Located at the depression approximately one horizontal finger&#x00027;s width (middle finger) posterior to the midpoint between the lateral end of the eyebrow and the outer canthus.</p></list-item>
<list-item><p><italic>Yuyao (EX-HN5):</italic> Located at the center of the eyebrow, directly above the pupil, with a tender sensation upon pressure.</p></list-item>
<list-item><p><italic>Zanzhu (ST2):</italic> Located in the depression at the medial end of the eyebrow, along the brow margin.</p></list-item>
<list-item><p><italic>Sibai (ST7):</italic> Located at the lower border of the zygomatic arch.</p></list-item>
<list-item><p><italic>Quanliu (SI18):</italic> Located in the depression below the zygomatic bone and directly below the lateral canthus.</p></list-item>
<list-item><p><italic>Yingxiang (LI20):</italic> Located at the side of the face, beside the midpoint of the nasolabial groove.</p></list-item>
<list-item><p><italic>Kouheliao (LI19):</italic> Located at the outer edge of the nostril, one-third of the distance from the upper to the lower part of the philtrum groove.</p></list-item>
<list-item><p><italic>Jiachengjiang (ST6):</italic> Located at a point one inch away on each side of the midpoint of the mental groove, level with Chengjiang (CV24).</p></list-item>
<list-item><p><italic>Dicang (ST4):</italic> Located at the side of the mouth, 0.4 cun (1 cun &#x02248; the width of the middle joint of the thumb) away from the corner of the mouth.</p></list-item>
<list-item><p><italic>Jiache (EX-HN19):</italic> Located approximately one horizontal finger&#x00027;s width (middle finger) above the anterior angle of the mandible.</p></list-item>
</list>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p>Introduction to acupuncture points.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0005.tif"/>
</fig>
</sec>
<sec>
<title>Comparison with previous works</title>
<p><italic>Comparison with YOLO-pose:</italic> YOLO-pose is improved based on YOLOv5 model and its basic structure is similar to YOLOv5. In the backbone of YOLOv8-ACU model, the CSP idea is still adopted. In order to achieve further lightweighting of the model, the C2f module is introduced to replace the C3 module in YOLOv5. In addition, despite some architectural optimization and improvements in YOLOv8, it still retains the SPPF module in the YOLOv5 architecture, which helps to enhance the feature extraction capability of the model.</p>
<p>YOLOv5 adopts the Coupled head &#x0002B; Anchor-based approach for the head part, while YOLOv8 utilizes the Decoupled head &#x0002B; Anchor-free approach. As a result, YOLOv8&#x00027;s decoupling of the detection head from the anchor boxes enhances the adaptability to objects of different scales, leading to improved detection performance (as shown in <xref ref-type="fig" rid="F6">Figure 6</xref>).</p>
<fig id="F6" position="float">
<label>Figure 6</label>
<caption><p>Comparison of mAP&#x00040;0.5 and mAP&#x00040;0.5&#x02013;0.95 results for four models.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0006.tif"/>
</fig>
<p>Experimental results show that, with a batch size of 4 and the default configuration and initial parameters, the YOLO-pose model achieves an mAP&#x00040;0.5 value of 92.90% on the acupoint keypoint detection task. Under the same settings, YOLOv8-pose, with the application of AdamW, achieves an mAP&#x00040;0.5 value of 95.70%. Furthermore, the parameter count of YOLOv8-ACU reduces from 7.2M in YOLO-pose to 2.96M, while the computational load decreases from 16.8 GFLOPs in YOLO-pose to 8.8 GFLOPs in YOLOv8-ACU. This indicates that YOLOv8-ACU not only improves the detection performance, but also makes the model more lightweight and efficient.</p>
<p><italic>Comparison with YOLOv7-pose:</italic> The C2f module in YOLOv8 is inspired by the E-ELAN module in YOLOv7, which enhances the gradient flow in the model by fusing different feature maps from multiple branch cross-layer networks. YOLOv8 achieves lightweight modeling by utilizing depth-wise separable convolution layers to reduce the parameter size and computational load.</p>
<p>In our experimental setup, when the batch size is set to 4, applying YOLOv7-pose for acupoint keypoint detection yields an mAP&#x00040;0.5 of 94.9%. However, under the same settings, YOLOv8-ACU achieves an mAP&#x00040;0.5 of 97.5%.</p>
<p>Alongside the improvement in accuracy, YOLOv8-ACU significantly reduces the parameter count from 80.3M in YOLOv7 to 2.96M, a roughly 27-fold reduction, while the computational load decreases from 101.8 GFLOPs to 8.8 GFLOPs, a decrease of 91%. Considering the overall detection performance and model complexity, YOLOv8-ACU maintains a high mAP value while experiencing a significant reduction in parameters and computational load, making it more suitable for real-world deployment. Therefore, compared to YOLOv7-pose, YOLOv8-ACU achieves both accuracy and efficiency improvements in acupoint keypoint detection tasks, making it more applicable in practical scenarios (as shown in <xref ref-type="fig" rid="F6">Figure 6</xref>).</p>
</sec>
<sec>
<title>Implementing tools and model parameters</title>
<p>The number of training epochs is set to 75, the batch size is set to 4, the optimiser is chosen to be AdamW, the initial learning rate is set to 0.01, and the momentum factor is set to 0.937.</p>
</sec>
<sec>
<title>Evaluation metrics</title>
<p>In the research, P (Precision) and R (Recall) are used as evaluation indexes for target detection. The calculation method of the indexes is as follows.</p>
<p>Precision is the proportion of positive class targets detected by the model that are truly positive class targets. In target detection, precision represents the ratio of targets correctly detected by the model to all bounding boxes detected as targets by the model. The calculation formula is Equation <xref ref-type="disp-formula" rid="E2">(2)</xref>:</p>
<disp-formula id="E2"><label>(2)</label><mml:math id="M2"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>P</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>Recall is the ratio of positive class targets detected by the model to the actual positive class targets, according to Equation <xref ref-type="disp-formula" rid="E3">(3)</xref>. In target detection, the recall rate represents the ratio of targets correctly detected by the model to the bounding boxes of all true positive class targets.</p>
<disp-formula id="E3"><label>(3)</label><mml:math id="M3"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>R</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>In keypoint detection, this study follows the official MS COCO validation criteria and uses the mean average precision based on the object keypoint similarity <italic>L</italic><sub><italic>oks</italic></sub> (Maji et al., <xref ref-type="bibr" rid="B25">2022</xref>) as the evaluation metric, where <italic>L</italic><sub><italic>oks</italic></sub> is given by Equation <xref ref-type="disp-formula" rid="E4">(4)</xref>:</p>
<disp-formula id="E4"><label>(4)</label><mml:math id="M4"><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>o</mml:mi><mml:mi>k</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle='true'><mml:msub><mml:mo>&#x02211;</mml:mo><mml:mi>i</mml:mi></mml:msub><mml:mrow><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msup><mml:mrow><mml:mi>exp</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mo>&#x02212;</mml:mo><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>d</mml:mi><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:msup><mml:mi>s</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:msubsup><mml:mi>k</mml:mi><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:msup><mml:mi>&#x003B4;</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x0003E;</mml:mo><mml:mn>0</mml:mn></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:mrow><mml:mrow><mml:mstyle displaystyle='true'><mml:msub><mml:mo>&#x02211;</mml:mo><mml:mi>i</mml:mi></mml:msub><mml:mrow><mml:mi>&#x003B4;</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x0003E;</mml:mo><mml:mn>0</mml:mn></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:mrow></mml:mfrac></mml:mrow></mml:math></disp-formula>
<p>where <italic>i</italic> is the labeled keypoint number; <inline-formula><mml:math id="M5"><mml:msubsup><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup></mml:math></inline-formula> is the square of the Euclidean distance between the detected keypoint location and the true keypoint location; <italic>s</italic><sup>2</sup> is the area occupied by the detected body in the image; <italic>k</italic><sub><italic>i</italic></sub> is the decay constant that controls the attenuation for keypoint category <italic>i</italic>; &#x003B4; is the impulse function, indicating that <italic>L</italic><sub><italic>oks</italic></sub> is computed only for the keypoints that are visible in the true annotations; <italic>v</italic><sub><italic>i</italic></sub> is the value of the visibility of the <italic>i</italic>-th keypoint (<italic>v</italic><sub><italic>i</italic></sub>&#x0003E;0 indicates that the keypoint is visible).</p>
<disp-formula id="E5"><label>(5)</label><mml:math id="M6"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>P</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>o</mml:mi><mml:msub><mml:mrow><mml:mi>n</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mrow><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mrow><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mrow><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<disp-formula id="E6"><label>(6)</label><mml:math id="M7"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi><mml:msub><mml:mrow><mml:mi>l</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mrow><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mrow><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mrow><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<disp-formula id="E7"><label>(7)</label><mml:math id="M8"><mml:mrow><mml:mi>A</mml:mi><mml:mi>P</mml:mi><mml:mo>=</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mstyle displaystyle='true'><mml:mrow><mml:msubsup><mml:mo>&#x0222B;</mml:mo><mml:mn>0</mml:mn><mml:mn>1</mml:mn></mml:msubsup><mml:mrow><mml:mi>P</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>o</mml:mi><mml:msub><mml:mi>n</mml:mi><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mi>d</mml:mi><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi><mml:msub><mml:mi>l</mml:mi><mml:mrow><mml:mi>k</mml:mi><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mrow></mml:mstyle></mml:mrow></mml:math></disp-formula>
<disp-formula id="E8"><label>(8)</label><mml:math id="M9"><mml:mrow><mml:mi>m</mml:mi><mml:mi>A</mml:mi><mml:mi>P</mml:mi><mml:mo>=</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mfrac><mml:mrow><mml:mstyle displaystyle='true'><mml:msubsup><mml:mo>&#x02211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:msubsup><mml:mrow><mml:mi>A</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mstyle></mml:mrow><mml:mi>N</mml:mi></mml:mfrac></mml:mrow></mml:math></disp-formula>
<p><italic>TP</italic><sub><italic>kpt</italic></sub> (True Positives) occurs when acupoints are correctly identified, with their predicted keypoints showing an <italic>L</italic><sub><italic>oks</italic></sub> above the threshold in comparison to actual acupoint keypoints. <italic>FP</italic><sub><italic>kpt</italic></sub> (False Positives) arises when non-acupoint areas are incorrectly identified as acupoints, indicated by predicted keypoints exceeding the <italic>L</italic><sub><italic>oks</italic></sub> threshold. <italic>FN</italic><sub><italic>kpt</italic></sub> (False Negatives) represents situations where actual acupoint keypoints are missed because the corresponding predicted keypoints do not meet the required <italic>L</italic><sub><italic>oks</italic></sub> threshold. The AP value is the area under the P-R curve according to Equations <xref ref-type="disp-formula" rid="E5">(5)</xref>&#x02013;<xref ref-type="disp-formula" rid="E7">(7)</xref>. mAP&#x00040;0.5 is the average of the AP values for all categories at a threshold of 0.5. mAP&#x00040;0.5&#x02013;0.95 considers a range of different <italic>L</italic><sub><italic>oks</italic></sub> thresholds, from 0.5 to 0.95, at intervals of 0.05 (for example, 0.5, 0.55, 0.6, &#x02026;, 0.95), and calculates the average of the AP values at these varying thresholds according to Equation <xref ref-type="disp-formula" rid="E8">(8)</xref>.</p>
<p>Additionally, this study selects the GFLOPs and the number of Parameters as evaluation criteria to measure the size of the model.</p>
</sec>
<sec>
<title>Experimental results and analysis</title>
<sec>
<title>Comparative experiments on keypoint detection models</title>
<p>To assess the comparison between YOLOv8-pose and other keypoint detection models, this study selected four different models for comparative experiments: YOLO-pose, YOLOv7-pose, YOLOv8-pose, and YOLOv8-ACU. The experimental results for each model are shown in <xref ref-type="table" rid="T2">Table 2</xref>. From the experimental results, it was found that when using pretrained models, YOLO-pose achieved 92.90% in mAP&#x00040;0.5 and 50.60% in mAP&#x00040;0.5&#x02013;0.95, while YOLOv7-pose achieved 94.90% in mAP&#x00040;0.5 and 54.90% in mAP&#x00040;0.5&#x02013;0.95. It can be observed that both YOLO-pose and YOLOv7-pose perform exceptionally well in terms of accuracy, but their model parameters and computational complexity are quite high.</p>
<p>On the other hand, YOLOv8-ACU outperforms other models in various aspects. Even when YOLO-pose and YOLOv7-pose are equipped with pretrained weights, they still cannot match the keypoint prediction accuracy of YOLOv8-ACU. Moreover, in clinical applications of facial acupoint detection, a higher recognition accuracy is typically required. Therefore, after incorporating Slim-neck, ECA attention mechanism, and more suitable loss functions, YOLOv8-ACU achieved a 1.8% improvement in mAP&#x00040;0.5 and a 3.1% improvement in mAP&#x00040;0.5&#x02013;0.95 compared to the original YOLOv8-pose. These improvements represent significant advancements in accuracy. Additionally, as shown in <xref ref-type="table" rid="T2">Table 2</xref>, YOLOv8-ACU has the smallest number of parameters and computational complexity among these four models, making its lightweight design more suitable for real-world clinical practice.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Comparative experiments.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Model</bold></th>
<th valign="top" align="center"><bold>Pre-trained</bold></th>
<th valign="top" align="center"><bold>mAP&#x00040;0.5/%</bold></th>
<th valign="top" align="center"><bold>mAP&#x00040;0.5&#x02013;0.95/%</bold></th>
<th valign="top" align="center"><bold>Parameters</bold></th>
<th valign="top" align="center"><bold>GFLOPs</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">YOLO-pose</td>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">92.90%</td>
<td valign="top" align="center">50.60%</td>
<td valign="top" align="center">7231912</td>
<td valign="top" align="center">16.8</td>
</tr>
<tr>
<td valign="top" align="left">YOLOv7-pose</td>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">94.90%</td>
<td valign="top" align="center">54.90%</td>
<td valign="top" align="center">80293736</td>
<td valign="top" align="center">101.8</td>
</tr>
<tr>
<td valign="top" align="left">YOLOv8-pose</td>
<td valign="top" align="center">No</td>
<td valign="top" align="center">95.70%</td>
<td valign="top" align="center">73.80%</td>
<td valign="top" align="center">3403229</td>
<td valign="top" align="center">9.7</td>
</tr>
<tr>
<td valign="top" align="left">YOLOv8-ACU</td>
<td valign="top" align="center">No</td>
<td valign="top" align="center">97.50%</td>
<td valign="top" align="center">76.90%</td>
<td valign="top" align="center">2962560</td>
<td valign="top" align="center">8.8</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>Ablation experiment</title>
<p>According to the ablation experiments in <xref ref-type="fig" rid="F7">Figure 7</xref>, it can be observed that adding the ECA attention mechanism improved the Recall by 3.1% and mAP&#x00040;0.5 by 0.9%. Adding the GIoU loss function increased the Recall by 0.2%, mAP&#x00040;0.5 by 0.2%, and mAP&#x00040;0.5&#x02013;0.95 by 1.4%. Integrating the lightweight structure, Slim-neck, improved Precision by 2.2%, mAP&#x00040;0.5 by 0.7%, and mAP&#x00040;0.5&#x02013;0.95 by 2.9%. Additionally, the model Parameters, Model Size, and GFLOPs decreased by 0.44M, 0.82MB, and 9.3%, respectively. From the loss function variation curve in <xref ref-type="fig" rid="F8">Figure 8</xref>, it can be observed that changing the loss function to GIoU Loss resulted in faster model convergence and improved accuracy.</p>
<fig id="F7" position="float">
<label>Figure 7</label>
<caption><p>Comparison of results from precision, recall, mAP&#x00040;0.5, and mAP&#x00040;0.5&#x02013;0.95.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0007.tif"/>
</fig>
<fig id="F8" position="float">
<label>Figure 8</label>
<caption><p>Variation curves of loss function for ablation experiments.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0008.tif"/>
</fig>
<p>The experimental results in <xref ref-type="table" rid="T3">Table 3</xref> demonstrate that compared to the original YOLOv8-pose network model, the proposed YOLOv8-ACU model achieved improvements in Precision (&#x0002B;0.2%), Recall (&#x0002B;2.0%), mAP&#x00040;0.5 (&#x0002B;1.8%), and mAP&#x00040;0.5&#x02013;0.95 (&#x0002B;3.1%). Additionally, the Parameters, Model Size, and GFLOPs of the model decreased by 0.44M, 0.82MB, and 9.3%, respectively, validating the effectiveness of the proposed algorithm improvements.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Ablation experiment.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>ECA</bold></th>
<th valign="top" align="center"><bold>GIoU</bold></th>
<th valign="top" align="center"><bold>SlimNeck</bold></th>
<th valign="top" align="center"><bold>Precision /%</bold></th>
<th valign="top" align="center"><bold>Recall /%</bold></th>
<th valign="top" align="center"><bold>mAP&#x00040;0.5 /%</bold></th>
<th valign="top" align="center"><bold>mAP&#x00040;0.5&#x02013;0.95/%</bold></th>
<th valign="top" align="center"><bold>Parameters /M</bold></th>
<th valign="top" align="center"><bold>ModelSize /MB</bold></th>
<th valign="top" align="center"><bold>GFLOPs</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">X</td>
<td valign="top" align="center">X</td>
<td valign="top" align="center">X</td>
<td valign="top" align="center">92.0</td>
<td valign="top" align="center">95.0</td>
<td valign="top" align="center">95.7</td>
<td valign="top" align="center">73.8</td>
<td valign="top" align="center">3.40</td>
<td valign="top" align="center">6.87</td>
<td valign="top" align="center">9.7</td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="center">X</td>
<td valign="top" align="center">X</td>
<td valign="top" align="center">90.8</td>
<td valign="top" align="center">98.1</td>
<td valign="top" align="center">96.6</td>
<td valign="top" align="center">72.6</td>
<td valign="top" align="center">3.40</td>
<td valign="top" align="center">6.87</td>
<td valign="top" align="center">9.7</td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="center">&#x02713;</td>
<td valign="top" align="center">X</td>
<td valign="top" align="center">90.0</td>
<td valign="top" align="center">98.3</td>
<td valign="top" align="center">96.8</td>
<td valign="top" align="center">74.0</td>
<td valign="top" align="center">3.40</td>
<td valign="top" align="center">6.87</td>
<td valign="top" align="center">9.7</td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="center">&#x02713;</td>
<td valign="top" align="center">&#x02713;</td>
<td valign="top" align="center">92.2</td>
<td valign="top" align="center">97.0</td>
<td valign="top" align="center">97.5</td>
<td valign="top" align="center">76.9</td>
<td valign="top" align="center">2.96</td>
<td valign="top" align="center">6.05</td>
<td valign="top" align="center">8.8</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>Verification of external test sets</title>
<p>To test the improved model&#x00027;s generalization ability and effectiveness in clinical applications, we employed an external test set consisting of frontal face photos in approximate real-world scenarios for independent model validation. The model, as shown in <xref ref-type="table" rid="T4">Table 4</xref>, achieved Precision of 99.6%, Recall of 99.8%, mAP&#x00040;0.5 of 99.5%, and mAP&#x00040;0.5&#x02013;0.95 of 80.7%, surpassing the performance on the Class I dataset. This demonstrates that the improved model exhibits strong generalization capabilities when handling real-world data, which is crucial for its application in actual clinical environments. In specific clinical scenarios where physicians are involved, the model must accurately identify frontal face photos to support acupuncture or massage therapies. Therefore, the improved model can effectively locate 11 facial acupoints and assist healthcare professionals in intelligent acupoint recognition during clinical practice.</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Test set validation results.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Precision/%</bold></th>
<th valign="top" align="center"><bold>Recall/%</bold></th>
<th valign="top" align="center"><bold>mAP&#x00040;0.5/%</bold></th>
<th valign="top" align="center"><bold>mAP&#x00040;0.5&#x02013;0.95/%</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">99.6</td>
<td valign="top" align="center">99.8</td>
<td valign="top" align="center">99.5</td>
<td valign="top" align="center">80.7</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>Acupoint detection results</title>
<p><xref ref-type="fig" rid="F9">Figure 9</xref> compares the detection results of YOLOv8-pose and YOLOv8-ACU (red dots indicate predicted acupoint locations and green dots indicate true acupoint locations; subtle differences in the sizes of the acupoint dots are due to the varying resolutions of the images). Both models recognize the acupoints well, but YOLOv8-ACU outperforms YOLOv8-pose on most acupoints, and its predicted acupoint positions lie closer to the actual ones. <xref ref-type="fig" rid="F10">Figure 10</xref> shows the validation results of YOLOv8-ACU on images from the external test set. Because these images are closer to the actual clinical environment and the faces are imaged more clearly, YOLOv8-ACU shows strong recognition and detection ability on them, and the predicted acupoint positions match the actual acupoint positions even more closely. However, due to a variety of factors such as sample size and individual differences, the model still has some error and uncertainty, and there is still room for improvement in recognition accuracy and precision. In the future, the acupoint detection method will be further improved to enhance its accuracy and reliability and to ensure its applicability in different environments and populations.</p>
<fig id="F9" position="float">
<label>Figure 9</label>
<caption><p>Acupoint-I acupoint prediction results.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0009.tif"/>
</fig>
<fig id="F10" position="float">
<label>Figure 10</label>
<caption><p>Acupoint-II acupoint prediction results.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnbot-18-1355857-g0010.tif"/>
</fig>
</sec>
</sec>
</sec>
<sec sec-type="discussion" id="s5">
<title>Discussion</title>
<p>Acupuncture points are a key concept in Chinese medicine. Different points have different effects, and the precise identification of points is the most important part of the acupuncture therapy process (Li et al., <xref ref-type="bibr" rid="B18">2015</xref>). Few studies have applied keypoint detection models to acupoint recognition. Zhang et al. (<xref ref-type="bibr" rid="B43">2023</xref>) used the FADbR model to detect acupoints on the face; most acupoints were detected well, but detection was poor where acupoints are sparsely distributed, and the model is capable of keypoint detection only. In contrast, YOLOv8-ACU performs both target detection and keypoint detection, which gives it better interactivity and a wider range of applicable scenarios. Compared with YOLO-pose (Maji et al., <xref ref-type="bibr" rid="B25">2022</xref>) and YOLOv7-pose (Pranavan et al., <xref ref-type="bibr" rid="B28">2023</xref>), YOLOv8-ACU also achieves better accuracy and a lighter model size.</p>
<p>By comparing YOLOv8-ACU, YOLOv8-pose, YOLOv7-pose, and YOLO-pose, it can be found that YOLOv8-ACU not only achieves better accuracy but also has a lighter model size and generalizes well to the external test set. This shows that the recognition effect and performance of the model can be effectively improved by adding the ECA attention mechanism, using the Slim-neck module, and changing to the GIoU loss function.</p>
<p>However, the model also has some defects. There are fewer categories of acupoints, which do not cover all the acupoints on the face, and there is no classification experiment for data under various light and occlusion conditions, which may lead to errors in the detection and localization of acupoints under low light, dark light or occlusion conditions. In the future, we will further expand the categories of facial acupoints and improve the performance of detecting acupoints under different occlusions and different light conditions, and deploy them in embedded devices for real clinical practice.</p>
</sec>
<sec sec-type="conclusions" id="s6">
<title>Conclusions</title>
<p>To enhance the accuracy of facial acupoint recognition for better application in clinical practice, this study utilized the YOLOv8-pose model, which has been recently introduced with high detection and localization accuracy, as the base model. It was applied to the task of facial acupoint recognition. Building upon this base model, the study incorporated the ECA attention mechanism, introduced the Slim-neck module, and replaced its loss function. These enhancements further improved the precise recognition of acupoints while reducing the model&#x00027;s complexity and computational load. Compared to the base YOLOv8-pose model, YOLOv8-ACU demonstrated improvements in Precision (&#x0002B;0.2%), Recall (&#x0002B;2.0%), mAP&#x00040;0.5 (&#x0002B;1.8%), and mAP&#x00040;0.5&#x02013;0.95 (&#x0002B;3.1%). Additionally, the Parameters, Model Size and GFLOPs decreased by 0.44M, 0.82MB, and 9.3% respectively. Comparing with other keypoint models, YOLOv8-ACU emerged as the most suitable model for acupoint recognition.</p>
</sec>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="ethics-statement" id="s8">
<title>Ethics statement</title>
<p>Written informed consent was obtained from the individual(s) for the publication of any potentially identifiable images or data included in this article.</p>
</sec>
<sec sec-type="author-contributions" id="s9">
<title>Author contributions</title>
<p>ZY: Conceptualization, Data curation, Formal analysis, Funding acquisition, Investigation, Methodology, Project administration, Resources, Software, Supervision, Validation, Visualization, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. PS: Formal analysis, Funding acquisition, Methodology, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing, Project administration, Resources. JL: Conceptualization, Data curation, Formal analysis, Funding acquisition, Writing &#x02013; original draft. YW: Investigation, Methodology, Project administration, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. ZZ: Data curation, Writing &#x02013; original draft. WQ: Data curation, Writing &#x02013; original draft. BC: Data curation, Writing &#x02013; original draft. YT: Resources, Software, Supervision, Validation, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. AH: Conceptualization, Software, Supervision, Validation, Visualization, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing.</p>
</sec>
</body>
<back>
<sec sec-type="funding-information" id="s10">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This research was supported in part by the China Ministry of Education Industry-University Cooperation Collaborative Education Project (220500643305240).</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Berretti</surname> <given-names>S.</given-names></name> <name><surname>Ben Amor</surname> <given-names>B.</given-names></name> <name><surname>Daoudi</surname> <given-names>M.</given-names></name> <name><surname>Del Bimbo</surname> <given-names>A.</given-names></name></person-group> (<year>2011</year>). <article-title>3D facial expression recognition using SIFT descriptors of automatically detected keypoints</article-title>. <source>The Visual Comput</source>. <volume>27</volume>, <fpage>1021</fpage>&#x02013;<lpage>1036</lpage>. <pub-id pub-id-type="doi">10.1007/s00371-011-0611-x</pub-id></citation>
</ref>
<ref id="B2">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Cai</surname> <given-names>Z.</given-names></name> <name><surname>Vasconcelos</surname> <given-names>N.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Cascade r-cnn: delving into high quality object detection,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>6154</fpage>&#x02013;<lpage>6162</lpage>.</citation>
</ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chon</surname> <given-names>T. Y.</given-names></name> <name><surname>Lee</surname> <given-names>M. C.</given-names></name></person-group> (<year>2013</year>). <article-title>Acupuncture</article-title>. <source>Mayo Clin. Proc</source>. <volume>88</volume>, <fpage>1141</fpage>&#x02013;<lpage>1146</lpage>. <pub-id pub-id-type="doi">10.1016/j.mayocp.2013.06.009</pub-id></citation>
</ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cootes</surname> <given-names>T.</given-names></name> <name><surname>Edwards</surname> <given-names>J.</given-names></name> <name><surname>Taylor</surname> <given-names>C.</given-names></name></person-group> (<year>1998</year>). <article-title>Active appearance models</article-title>. <source>IEEE Trans. Pattern Anal. Mach. Int.</source> <volume>23</volume>, <fpage>681</fpage>&#x02013;<lpage>685</lpage>. <pub-id pub-id-type="doi">10.1109/34.927467</pub-id></citation>
</ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cootes</surname> <given-names>T. F.</given-names></name> <name><surname>Taylor</surname> <given-names>C. J.</given-names></name> <name><surname>Cooper</surname> <given-names>D. H.</given-names></name> <name><surname>Graham</surname> <given-names>J.</given-names></name></person-group> (<year>1995</year>). <article-title>Active shape models-their training and application</article-title>. <source>Computer Vision Image Understanding</source> <volume>61</volume>, <fpage>38</fpage>&#x02013;<lpage>59</lpage>. <pub-id pub-id-type="doi">10.1006/cviu.1995.1004</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Deng</surname> <given-names>J.</given-names></name> <name><surname>Guo</surname> <given-names>J.</given-names></name> <name><surname>Xue</surname> <given-names>N.</given-names></name> <name><surname>Zafeiriou</surname> <given-names>S.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Arcface: Additive angular margin loss for deep face recognition,&#x0201D;</article-title> in <source>Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>4690</fpage>&#x02013;<lpage>4699</lpage>.<pub-id pub-id-type="pmid">34106845</pub-id></citation></ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Deng</surname> <given-names>Y.</given-names></name> <name><surname>Hui</surname> <given-names>S.</given-names></name> <name><surname>Zhou</surname> <given-names>S.</given-names></name> <name><surname>Huang</surname> <given-names>W.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name></person-group> (<year>2023</year>). <article-title>Context adaptive network for image inpainting</article-title>. <source>IEEE Trans. Image Process.</source> <pub-id pub-id-type="doi">10.1109/TIP.2023.3298560</pub-id><pub-id pub-id-type="pmid">37506026</pub-id></citation></ref>
<ref id="B8">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Doll&#x000E1;r</surname> <given-names>P.</given-names></name> <name><surname>Welinder</surname> <given-names>P.</given-names></name> <name><surname>Perona</surname> <given-names>P.</given-names></name></person-group> (<year>2010</year>). <article-title>&#x0201C;Cascaded pose regression,&#x0201D;</article-title> in <source>2010 IEEE Computer Society Conference on Computer Vision and Pattern Recognition</source>, <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>1078</fpage>&#x02013;<lpage>1085</lpage>.</citation>
</ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elfwing</surname> <given-names>S.</given-names></name> <name><surname>Uchibe</surname> <given-names>E.</given-names></name> <name><surname>Doya</surname> <given-names>K.</given-names></name></person-group> (<year>2018</year>). <article-title>Sigmoid-weighted linear units for neural network function approximation in reinforcement learning</article-title>. <source>Neural Netw.</source> <volume>107</volume>, <fpage>3</fpage>&#x02013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1016/j.neunet.2017.12.012</pub-id><pub-id pub-id-type="pmid">29395652</pub-id></citation></ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Godson</surname> <given-names>D. R.</given-names></name> <name><surname>Wardle</surname> <given-names>J. L.</given-names></name></person-group> (<year>2019</year>). <article-title>Accuracy and precision in acupuncture point location: a critical systematic review</article-title>. <source>J. Acupunctur. Merid. Stu.</source> <volume>12</volume>, <fpage>52</fpage>&#x02013;<lpage>66</lpage>. <pub-id pub-id-type="doi">10.1016/j.jams.2018.10.009</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>He</surname> <given-names>K.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Ren</surname> <given-names>S.</given-names></name> <name><surname>Sun</surname> <given-names>J.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;Deep residual learning for image recognition,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>770</fpage>&#x02013;<lpage>778</lpage>.</citation>
</ref>
<ref id="B12">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>J.</given-names></name> <name><surname>Shen</surname> <given-names>L.</given-names></name> <name><surname>Sun</surname> <given-names>G.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Squeeze-and-excitation networks,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>7132</fpage>&#x02013;<lpage>7141</lpage>.</citation>
</ref>
<ref id="B13">
<citation citation-type="book"><person-group person-group-type="author"><collab>International Organisation for Standardization</collab></person-group> (<year>2021</year>). <source>ISO 16672. Traditional Chinese Medicine - International Code for Acupuncture Points.</source> <publisher-loc>Geneva</publisher-loc>: <publisher-name>ISO</publisher-name>.</citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jin</surname> <given-names>B.</given-names></name> <name><surname>Cruz</surname> <given-names>L.</given-names></name> <name><surname>Gon&#x000E7;alves</surname> <given-names>N.</given-names></name></person-group> (<year>2020</year>). <article-title>Deep facial diagnosis: deep transfer learning from face recognition to facial diagnosis</article-title>. <source>IEEE Access</source> <volume>8</volume>, <fpage>123649</fpage>&#x02013;<lpage>123661</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2020.3005687</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jin</surname> <given-names>B.</given-names></name> <name><surname>Cruz</surname> <given-names>L.</given-names></name> <name><surname>Gon&#x000E7;alves</surname> <given-names>N.</given-names></name></person-group> (<year>2022</year>). <article-title>Pseudo RGB-D face recognition</article-title>. <source>IEEE Sensors J.</source> <volume>22</volume>, <fpage>21780</fpage>&#x02013;<lpage>21794</lpage>. <pub-id pub-id-type="doi">10.1109/JSEN.2022.3197235</pub-id></citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jocher</surname> <given-names>G.</given-names></name> <name><surname>Stoken</surname> <given-names>A.</given-names></name> <name><surname>Borovec</surname> <given-names>J.</given-names></name> <name><surname>Changyu</surname> <given-names>L.</given-names></name> <name><surname>Hogan</surname> <given-names>A.</given-names></name> <name><surname>Diaconu</surname> <given-names>L.</given-names></name> <etal/></person-group>. (<year>2020</year>). ultralytics/yolov5, v3.0. Zenodo.</citation>
</ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>Y. S.</given-names></name> <name><surname>Ryu</surname> <given-names>Y.</given-names></name> <name><surname>Yoon</surname> <given-names>D. E.</given-names></name> <name><surname>Kim</surname> <given-names>C. H.</given-names></name> <name><surname>Hong</surname> <given-names>G.</given-names></name> <name><surname>Hwang</surname> <given-names>Y. C.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Commonality and specificity of acupuncture point selections</article-title>. <source>Evid. Based Complem. Alternat. Med.</source> <pub-id pub-id-type="doi">10.1155/2020/2948292</pub-id><pub-id pub-id-type="pmid">32802119</pub-id></citation></ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>F.</given-names></name> <name><surname>He</surname> <given-names>T.</given-names></name> <name><surname>Xu</surname> <given-names>Q.</given-names></name> <name><surname>Lin</surname> <given-names>L. T.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>What is the acupoint? A preliminary review of acupoints</article-title>. <source>Pain Med.</source> <volume>16</volume>, <fpage>1905</fpage>&#x02013;<lpage>1915</lpage>. <pub-id pub-id-type="doi">10.1111/pme.12761</pub-id><pub-id pub-id-type="pmid">25975413</pub-id></citation></ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Wei</surname> <given-names>H.</given-names></name> <name><surname>Liu</surname> <given-names>Z.</given-names></name> <name><surname>Zhan</surname> <given-names>Z.</given-names></name> <name><surname>Ren</surname> <given-names>Q.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Slim-neck by GSConv: A better design paradigm of detector architectures for autonomous vehicles</article-title>. <source>arXiv [Preprint]. arXiv:2206.02424.</source></citation>
</ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lim</surname> <given-names>S.</given-names></name></person-group> (<year>2010</year>). <article-title>WHO standard acupuncture point locations</article-title>. <source>Evid. Based Complem. Alternat. Med.</source> <volume>7</volume>, <fpage>167</fpage>&#x02013;<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1093/ecam/nep006</pub-id><pub-id pub-id-type="pmid">19204011</pub-id></citation></ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>S.</given-names></name> <name><surname>Yi</surname> <given-names>P.</given-names></name></person-group> (<year>2019</year>). <article-title>Human acupoint positioning system based on binocular vision</article-title>. <source>IOP Conf. Series Mat. Sci. Eng.</source> <volume>569</volume>, <fpage>042029</fpage>. <pub-id pub-id-type="doi">10.1088/1757-899X/569/4/042029</pub-id></citation>
</ref>
<ref id="B22">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>T. Y.</given-names></name> <name><surname>Doll&#x000E1;r</surname> <given-names>P.</given-names></name> <name><surname>Girshick</surname> <given-names>R.</given-names></name> <name><surname>He</surname> <given-names>K.</given-names></name> <name><surname>Hariharan</surname> <given-names>B.</given-names></name> <name><surname>Belongie</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>&#x0201C;Feature pyramid networks for object detection,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition</source>. <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>2117</fpage>&#x02013;<lpage>2125</lpage>.</citation>
</ref>
<ref id="B23">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Qi</surname> <given-names>L.</given-names></name> <name><surname>Qin</surname> <given-names>H.</given-names></name> <name><surname>Shi</surname> <given-names>J.</given-names></name> <name><surname>Jia</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Path aggregation network for instance segmentation,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>8759</fpage>&#x02013;<lpage>8768</lpage>.</citation>
</ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lowe</surname> <given-names>D. G.</given-names></name></person-group> (<year>2004</year>). <article-title>Distinctive image features from scale-invariant keypoints</article-title>. <source>Int. J. Comput. Vision</source> <volume>60</volume>, <fpage>91</fpage>&#x02013;<lpage>110</lpage>. <pub-id pub-id-type="doi">10.1023/B:VISI.0000029664.99615.94</pub-id></citation>
</ref>
<ref id="B25">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Maji</surname> <given-names>D.</given-names></name> <name><surname>Nagori</surname> <given-names>S.</given-names></name> <name><surname>Mathew</surname> <given-names>M.</given-names></name> <name><surname>Poddar</surname> <given-names>D.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Yolo-pose: Enhancing yolo for multi person pose estimation using object keypoint similarity loss,&#x0201D;</article-title> in <source>Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>2637</fpage>&#x02013;<lpage>2646</lpage>.</citation>
</ref>
<ref id="B26">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Newell</surname> <given-names>A.</given-names></name> <name><surname>Yang</surname> <given-names>K.</given-names></name> <name><surname>Deng</surname> <given-names>J.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;Stacked hourglass networks for human pose estimation,&#x0201D;</article-title> in <source>Computer Vision&#x02013;ECCV 2016, 14th European Conference, Amsterdam, The Netherlands.</source> <publisher-loc>Amsterdam</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name>, <fpage>483</fpage>&#x02013;<lpage>499</lpage>.</citation>
</ref>
<ref id="B27">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Platt</surname> <given-names>J.</given-names></name></person-group> (<year>1998</year>). <source>Sequential Minimal Optimization: a Fast Algorithm for Training Support Vector Machines</source>. Technical Report MSR-TR-98-14, Microsoft Research. Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.research.microsoft.com/~jplatt/smo.html">http://www.research.microsoft.com/~jplatt/smo.html</ext-link></citation>
</ref>
<ref id="B28">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Pranavan</surname> <given-names>V. M.</given-names></name> <name><surname>Shekar</surname> <given-names>M.</given-names></name> <name><surname>Ngadiran</surname> <given-names>R.</given-names></name> <name><surname>Ravindran</surname> <given-names>S.</given-names></name></person-group> (<year>2023</year>). <article-title>&#x0201C;Fall detection system for monitoring elderly people using YOLOv7-pose detection model,&#x0201D;</article-title> in <source>2023 International Conference on Computer, Electronics and Electrical Engineering and their Applications (IC2E3).</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>1</fpage>&#x02013;<lpage>6</lpage>.</citation>
</ref>
<ref id="B29">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Qian</surname> <given-names>Q.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Jin</surname> <given-names>R.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;DR loss: improving object detection by distributional ranking,&#x0201D;</article-title> in <source>Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>12164</fpage>&#x02013;<lpage>12172</lpage>.</citation>
</ref>
<ref id="B30">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Redmon</surname> <given-names>J.</given-names></name> <name><surname>Divvala</surname> <given-names>S.</given-names></name> <name><surname>Girshick</surname> <given-names>R.</given-names></name> <name><surname>Farhadi</surname> <given-names>A.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;You only look once: unified, real-time object detection,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>779</fpage>&#x02013;<lpage>788</lpage>.</citation>
</ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ren</surname> <given-names>A.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Ding</surname> <given-names>C.</given-names></name> <name><surname>Qiu</surname> <given-names>Q.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>SC-DCNN: highly-scalable deep convolutional neural network using stochastic computing</article-title>. <source>ACM SIGPLAN Notices</source> <volume>52</volume>, <fpage>405</fpage>&#x02013;<lpage>418</lpage>. <pub-id pub-id-type="doi">10.1145/3093336.3037746</pub-id></citation>
</ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ren</surname> <given-names>S.</given-names></name> <name><surname>He</surname> <given-names>K.</given-names></name> <name><surname>Girshick</surname> <given-names>R.</given-names></name> <name><surname>Sun</surname> <given-names>J.</given-names></name></person-group> (<year>2015</year>). <article-title>Faster R-CNN: towards real-time object detection with region proposal networks</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>28</volume>, <fpage>1</fpage>&#x02013;<lpage>14</lpage>.<pub-id pub-id-type="pmid">27295650</pub-id></citation></ref>
<ref id="B33">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Rezatofighi</surname> <given-names>H.</given-names></name> <name><surname>Tsoi</surname> <given-names>N.</given-names></name> <name><surname>Gwak</surname> <given-names>J.</given-names></name> <name><surname>Sadeghian</surname> <given-names>A.</given-names></name> <name><surname>Reid</surname> <given-names>I.</given-names></name> <name><surname>Savarese</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>&#x0201C;Generalized intersection over union: a metric and a loss for bounding box regression,&#x0201D;</article-title> in <source>Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>658</fpage>&#x02013;<lpage>666</lpage>.</citation>
</ref>
<ref id="B34">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Sandler</surname> <given-names>M.</given-names></name> <name><surname>Howard</surname> <given-names>A.</given-names></name> <name><surname>Zhu</surname> <given-names>M.</given-names></name> <name><surname>Zhmoginov</surname> <given-names>A.</given-names></name> <name><surname>Chen</surname> <given-names>L. C.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;MobileNetV2: inverted residuals and linear bottlenecks,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>4510</fpage>&#x02013;<lpage>4520</lpage>.</citation>
</ref>
<ref id="B35">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Tang</surname> <given-names>X.</given-names></name></person-group> (<year>2013</year>). <article-title>&#x0201C;Deep convolutional network cascade for facial point detection,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>3476</fpage>&#x02013;<lpage>3483</lpage>.</citation>
</ref>
<ref id="B36">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Tian</surname> <given-names>L.</given-names></name></person-group> (<year>2010</year>). <source>Acupuncture and Moxibustion for Peripheral Facial Paralysis</source>. <publisher-loc>Shandong</publisher-loc>: <publisher-name>Shandong University of Traditional Chinese Medicine</publisher-name>.</citation>
</ref>
<ref id="B37">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Q.</given-names></name> <name><surname>Wu</surname> <given-names>B.</given-names></name> <name><surname>Zhu</surname> <given-names>P.</given-names></name> <name><surname>Li</surname> <given-names>P.</given-names></name> <name><surname>Zuo</surname> <given-names>W.</given-names></name> <name><surname>Hu</surname> <given-names>Q.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>&#x0201C;ECA-Net: Efficient channel attention for deep convolutional neural networks,&#x0201D;</article-title> in <source>Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>11534</fpage>&#x02013;<lpage>11542</lpage>.</citation>
</ref>
<ref id="B38">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wei</surname> <given-names>S. E.</given-names></name> <name><surname>Ramakrishna</surname> <given-names>V.</given-names></name> <name><surname>Kanade</surname> <given-names>T.</given-names></name> <name><surname>Sheikh</surname> <given-names>Y.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;Convolutional pose machines,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>4724</fpage>&#x02013;<lpage>4732</lpage>.</citation>
</ref>
<ref id="B39">
<citation citation-type="book"><person-group person-group-type="author"><collab>World Health Organization and Regional Office for the Western Pacific</collab></person-group> (<year>2008</year>). <source>WHO Standard Acupuncture Point Locations in the Western Pacific Region</source>. <publisher-loc>Geneva</publisher-loc>: <publisher-name>World Health Organization</publisher-name>.</citation>
</ref>
<ref id="B40">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>S.</given-names></name> <name><surname>Luo</surname> <given-names>P.</given-names></name> <name><surname>Loy</surname> <given-names>C. C.</given-names></name> <name><surname>Tang</surname> <given-names>X.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;WIDER FACE: a face detection benchmark,&#x0201D;</article-title> in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition.</source> <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name>, <fpage>5525</fpage>&#x02013;<lpage>5533</lpage>.</citation>
</ref>
<ref id="B41">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>J.</given-names></name> <name><surname>Jiang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Cao</surname> <given-names>Z.</given-names></name> <name><surname>Huang</surname> <given-names>T.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;UnitBox: an advanced object detection network,&#x0201D;</article-title> in <source>Proceedings of the 24th ACM International Conference on Multimedia.</source> <publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>, <fpage>516</fpage>&#x02013;<lpage>520</lpage>.</citation>
</ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>Q.</given-names></name> <name><surname>Liang</surname> <given-names>J.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name></person-group> (<year>2021</year>). <article-title>Data mining analysis on the selection pattern of acupuncture points for peripheral facial paralysis</article-title>. <source>China TCM Emerg.</source> <volume>30</volume>, <fpage>1522</fpage>&#x02013;<lpage>1526</lpage>.</citation>
</ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>T.</given-names></name> <name><surname>Yang</surname> <given-names>H.</given-names></name> <name><surname>Lin</surname> <given-names>Y.</given-names></name></person-group> (<year>2023</year>). <article-title>A framework for detecting facial acupoints in traditional Chinese medicine by integrating representation learning</article-title>. <source>J. Univ. Electr. Sci. Technol.</source> <volume>52</volume>, <fpage>175</fpage>&#x02013;<lpage>181</lpage>.</citation>
</ref>
<ref id="B44">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>C.</given-names></name></person-group> (<year>2022</year>). <source>Research on AR System for Facial Acupoint Recognition Based on Deep Learning</source>. <publisher-loc>Qingdao</publisher-loc>: <publisher-name>Qingdao University of Science and Technology</publisher-name>.</citation>
</ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>M.</given-names></name></person-group> (<year>2009</year>). <article-title>Evidence based acupuncture practice recommendations for peripheral facial paralysis</article-title>. <source>Am. J. Chin. Med.</source> <volume>37</volume>, <fpage>35</fpage>&#x02013;<lpage>43</lpage>. <pub-id pub-id-type="doi">10.1142/S0192415X09006631</pub-id><pub-id pub-id-type="pmid">19222110</pub-id></citation></ref>
<ref id="B46">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>L.</given-names></name> <name><surname>Qin</surname> <given-names>B.</given-names></name> <name><surname>Zhuang</surname> <given-names>T.</given-names></name> <name><surname>Tiede</surname> <given-names>U.</given-names></name> <name><surname>H&#x000F6;hne</surname> <given-names>K. H.</given-names></name></person-group> (<year>2005</year>). <article-title>Localization of acupoints on a head based on a 3D virtual body</article-title>. <source>Image Vis. Comput.</source> <volume>23</volume>, <fpage>1</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.imavis.2004.03.005</pub-id></citation>
</ref>
<ref id="B47">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>Z.</given-names></name> <name><surname>Wang</surname> <given-names>P.</given-names></name> <name><surname>Liu</surname> <given-names>W.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Ye</surname> <given-names>R.</given-names></name> <name><surname>Ren</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Distance-IoU loss: Faster and better learning for bounding box regression</article-title>. <source>Proc. AAAI Conf. Artif. Intell.</source> <volume>34</volume>, <fpage>12993</fpage>&#x02013;<lpage>13000</lpage>. <pub-id pub-id-type="doi">10.1609/aaai.v34i07.6999</pub-id></citation>
</ref>
</ref-list>
</back>
</article>