﻿<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1 20151215//EN" "JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">Explor Med</journal-id>
<journal-id journal-id-type="publisher-id">EM</journal-id>
<journal-title-group>
<journal-title>Exploration of Medicine</journal-title>
</journal-title-group>
<issn pub-type="epub">2692-3106</issn>
<publisher>
<publisher-name>Open Exploration Publishing</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.37349/emed.2024.00250</article-id>
<article-id pub-id-type="manuscript">1001250</article-id>
<article-categories>
<subj-group>
<subject>Original Article</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>MUCM-Net: a Mamba powered UCM-Net for skin lesion segmentation</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-5953-220X</contrib-id>
<name>
<surname>Yuan</surname>
<given-names>Chunyu</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing—original draft</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="cor1">
<sup>*</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-0677-634X</contrib-id>
<name>
<surname>Zhao</surname>
<given-names>Dongfang</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-4601-4507</contrib-id>
<name>
<surname>Agaian</surname>
<given-names>Sos S.</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<role content-type="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<xref ref-type="aff" rid="I1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="I3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="editor">
<name>
<surname>Farrer</surname>
<given-names>Lindsay A.</given-names>
</name>
<role>Academic Editor</role>
<aff>Boston University School of Medicine, USA</aff>
</contrib>
</contrib-group>
<aff id="I1">
<sup>1</sup>Department of Computer Science, The Graduate Center, City University of New York, New York, NY 10016, USA</aff>
<aff id="I2">
<sup>2</sup>Paul G. Allen School of Computer Science &amp; Engineering, University of Washington, Seattle, WA 98195, USA</aff>
<aff id="I3">
<sup>3</sup>Department of Computer Science, College of Staten Island, City University of New York, New York, NY 10314, USA</aff>
<author-notes>
<corresp id="cor1">
<sup>*</sup>
<bold>Correspondence:</bold> Chunyu Yuan, Department of Computer Science, The Graduate Center, City University of New York, New York, NY 10016, USA. <email>cyuan1@gradcenter.cuny.edu</email></corresp>
</author-notes>
<pub-date pub-type="ppub">
<year>2024</year>
</pub-date>
<pub-date pub-type="epub">
<day>25</day>
<month>10</month>
<year>2024</year>
</pub-date>
<volume>5</volume>
<issue>6</issue>
<fpage>694</fpage>
<lpage>708</lpage>
<history>
<date date-type="received">
<day>10</day>
<month>06</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>27</day>
<month>08</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>© The Author(s) 2024.</copyright-statement>
<license xlink:href="https://creativecommons.org/licenses/by/4.0/">
<license-p>This is an Open Access article licensed under a Creative Commons Attribution 4.0 International License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, sharing, adaptation, distribution and reproduction in any medium or format, for any purpose, even commercially, as long as you give appropriate credit to the original author(s) and the source, provide a link to the Creative Commons license, and indicate if changes were made.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Aim:</title>
<p id="absp-1">Skin lesion segmentation is critical for early skin cancer detection. Challenges in automatic segmentation from dermoscopic images include variations in color, texture, and artifacts of indistinct lesion boundaries. This study aims to develop and evaluate MUCM-Net, a lightweight and efficient model for skin lesion segmentation, leveraging Mamba state-space models integrated with UCM-Net architecture optimized for mobile deployment and early skin cancer detection.</p>
</sec>
<sec>
<title>Methods:</title>
<p id="absp-2">MUCM-Net combines Convolutional Neural Networks (CNNs), multi-layer perceptions (MLPs), and Mamba elements into a hybrid feature learning module.</p>
</sec>
<sec>
<title>Results:</title>
<p id="absp-3">The model was trained and tested on the International Skin Imaging Collaboration (ISIC) 2017 and ISIC2018 datasets, consisting of 2,000 and 2,594 dermoscopic images, respectively. Critical metrics for evaluation included Dice Similarity Coefficient (DSC), sensitivity (SE), specificity (SP), and accuracy (ACC). The model’s computational efficiency was also assessed by measuring Giga Floating-point Operations Per Second (GFLOPS) and the number of parameters. MUCM-Net demonstrated superior performance in skin lesion segmentation with an average DSC of 0.91 on the ISIC2017 dataset and 0.89 on the ISIC2018 dataset, outperforming existing models. It achieved high SE (0.93), SP (0.95), and ACC (0.92) with low computational demands (0.055–0.064 GFLOPS).</p>
</sec>
<sec>
<title>Conclusions:</title>
<p id="absp-4">The model’s innovative Mamba-UCM layer significantly enhanced feature learning while maintaining efficiency that is suitable for mobile devices. MUCM-Net establishes a new standard in lightweight skin lesion segmentation, balancing exceptional ACC with efficient computational performance. Its ability to perform well on mobile devices makes it a scalable tool for early skin cancer detection in resource-limited settings. The open-source availability of MUCM-Net supports further research and collaboration, promoting advances in mobile health diagnostics and the fight against skin cancer. MUCM-Net source code will be posted on <ext-link xlink:href="https://github.com/chunyuyuan/MUCM-Net" ext-link-type="uri">https://github.com/chunyuyuan/MUCM-Net</ext-link>.</p>
</sec>
</abstract>
<kwd-group>
<kwd>Medical image segmentation</kwd>
<kwd>lightweight model</kwd>
<kwd>mobile health</kwd>
<kwd>machine learning</kwd>
<kwd>skin cancer</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p id="p-1">Skin cancer is primarily classified into two major types: melanoma and non-melanoma. Despite melanoma accounting for only 1% of skin cancer cases, it is responsible for the majority of skin cancer-related fatalities due to its aggressive behavior. In 2022, melanoma led to approximately 7,800 deaths in the United States, with an estimated 98,000 new cases anticipated in 2023 [<xref ref-type="bibr" rid="B1">1</xref>]. The lifetime risk for Americans developing skin cancer is alarmingly high, with current statistics showing that one in five individuals will be affected. This underscores the critical need for effective diagnostic and treatment approaches. The financial impact is also considerable, with skin cancer treatment in the U.S. exceeding $8.1 billion [<xref ref-type="bibr" rid="B2">2</xref>]. Malignant melanoma, in particular, is notorious for its rapid progression and high mortality rate, making early and accurate detection essential for improving patient outcomes. Dermatoscopy and dermoscopy play a vital role in the clinical evaluation of skin lesions, helping dermatologists to identify malignant characteristics [<xref ref-type="bibr" rid="B3">3</xref>–<xref ref-type="bibr" rid="B5">5</xref>]. However, manual interpretation can be time-consuming and error-prone, dependent on the clinician’s expertise. Recent advancements have introduced machine learning-driven techniques into clinical practice to improve diagnosis accuracy and efficiency. These techniques are particularly beneficial in computationally constrained environments like mobile health applications [<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B7">7</xref>].</p>
<p id="p-2">Manual interpretation can be time-consuming, error-prone, and heavily dependent on the clinician’s expertise. Furthermore, certain medical samples present considerable challenges [<xref ref-type="bibr" rid="B8">8</xref>]. These challenges include indistinct boundaries where lesions merge seamlessly with the surrounding skin, making it difficult to delineate them clearly. Variations in lighting can alter the appearance of lesions, affecting the consistency of their visual features. Obstructions such as hair and bubbles may obscure lesion edges, complicating accurate segmentation. Additionally, variations in lesion size and shape, along with inconsistencies in imaging conditions and resolutions, can lead to inaccuracies in the segmentation process. Age-related skin changes can impact texture and appearance, further complicating detection. Complex backgrounds and differences in skin tone, influenced by factors such as race and environmental conditions, also contribute to the difficulty of achieving precise segmentation. Addressing these issues requires advanced techniques that can adapt to these varying conditions and ensure accurate diagnosis. <xref ref-type="fig" rid="fig1">Figure 1</xref> presents some representative complex skin lesion samples.</p>
<fig id="fig1" position="float">
<label>Figure 1</label>
<caption>
<p id="fig1-p-1">
<bold>Complex skin lesion samples</bold>. (<bold>A</bold>) Artifacts arising from the image acquisition process; (<bold>B</bold>) lesions obstructed by hair; (<bold>C</bold>) subtle differences between lesion and skin color; (<bold>D</bold>) low contrast between the wound and surrounding skin</p>
<p id="fig1-p-2">
<italic>Note.</italic> Source from International Skin Imaging Collaboration (ISIC) datasets [<xref ref-type="bibr" rid="B18">18</xref>–<xref ref-type="bibr" rid="B21">21</xref>]</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="em-05-1001250-g001.tif" />
</fig>
<p id="p-3">Recent advancements in artificial intelligence (AI) have increasingly integrated computer-aided tools into clinical practice to enhance skin cancer diagnosis [<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>]. A crucial technique in this process is skin cancer segmentation, which accurately delineates the boundaries of skin lesions in medical images. This segmentation is vital for accurately assessing lesion characteristics, monitoring their progression, and guiding treatment decisions. With rapid advancements in AI techniques and the widespread adoption of smart devices, such as point-of-care ultrasound (POCUS) devices or smartphones [<xref ref-type="bibr" rid="B11">11</xref>–<xref ref-type="bibr" rid="B13">13</xref>], AI-driven approaches for skin cancer detection have become popular.</p>
<p id="p-4">Patients now enjoy enhanced access to medical information, remote monitoring, and tailored care, which has improved their overall satisfaction with healthcare services. Despite these positive changes, certain obstacles remain, particularly in medical diagnostics. A notable issue is the precise and efficient segmentation of skin lesions, which is critical for diagnosis but challenging to implement on devices with limited computational resources. Most AI-driven medical applications rely on deep learning techniques described in detail by [<xref ref-type="bibr" rid="B14">14</xref>]. These methods typically require significant computational power and extensive learning parameters to deliver accurate predictions, posing a challenge for integration into devices with constrained hardware capabilities [<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>].</p>
<p id="p-5">In this study, we extend our previous method UCM-Net [<xref ref-type="bibr" rid="B17">17</xref>], and introduce MUCM-Net, a lightweight, robust, and Mamba-powered approach for skin lesion segmentation. MUCM-Net leverages a new novel hybrid module that combines Convolutional Neural Networks (CNNs), multi-layer perceptions (MLPs), and Mamba to enhance feature learning. Utilizing new proposed group loss functions, our method surpasses existing Mamba-based techniques in skin lesion segmentation. <xref ref-type="fig" rid="fig2">Figure 2</xref> presents the visualization of comparative experimental results on the International Skin Imaging Collaboration (ISIC) 2017 dataset [<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B19">19</xref>]. More results will be provided in the following “<xref ref-type="sec" rid="s3">Results</xref> and <xref ref-type="sec" rid="s4">Discussion</xref>” sessions.</p>
<fig id="fig2" position="float">
<label>Figure 2</label>
<caption>
<p id="fig2-p-1">
<bold>Comparative results on the International Skin Imaging Collaboration (ISIC) 2017 dataset</bold>. The X-axis shows the Dice Similarity Coefficient (DSC, higher values indicate better performance), and the Y-axis represents Giga Floating-point Operations Per Second (GFLOPS, lower values indicate greater efficiency). LightM-UNet’s result is out of range in the zoom-in window due to GFLOPS</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="em-05-1001250-g002.tif" />
</fig>
<p id="p-6">Key contributions of MUCM-Net include:</p>
<p id="p-7">
<list list-type="bullet">
<list-item>
<p>Hybrid feature learning: The MUCM-Net block integrates CNN, MLP, and Mamba elements, enhancing the learning of complex and distinct lesion features. We explore the application of the Mamba structure to increase the feature learning ability.</p>
</list-item>
<list-item>
<p>Computational efficiency: MUCM-Net’s design, based on Mamba-UCM blocks and UCM-Net, prioritizes accuracy and efficiency. It achieves high prediction performance with low computational demands [approx. 0.055–0.064 Giga Floating-point Operations Per Second (GFLOPS)], making it suitable for various deployment scenarios.</p>
</list-item>
<list-item>
<p>Enhanced loss function: A novel loss function integrates output and internal stage losses, ensuring efficient learning during the model’s training process.</p>
</list-item>
<list-item>
<p>Superior results: MUCM-Net achieves exceptional results on the ISIC2017 [<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B19">19</xref>] and ISIC2018 datasets [<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>], outperforming previous Mamba-based methods on metrics like Dice similarity, sensitivity, specificity, and accuracy.</p>
</list-item>
</list>
</p>
<sec id="t1-1">
<title>Related works</title>
<p id="p-8">Tiny machine learning (TinyML) for healthcare: Biomedical imaging segmentation, which involves accurately delineating anatomical structures and pathological regions from medical images, is essential for precise diagnostics. Recent advances in AI have significantly improved segmentation methods, enhancing both their accuracy and efficiency. A burgeoning area of research in this field is the integration of TinyML into healthcare, particularly for applications like lesion segmentation, offering exciting possibilities for both research and practical use.</p>
<p id="p-9">TinyML refers to deploying machine learning models on low-power, compact hardware. This technology holds the potential to revolutionize healthcare by enabling advanced analytical capabilities directly at the point of care. It facilitates real-time, on-device processing, making sophisticated medical image analysis feasible even in settings with limited traditional computing resources or in mobile healthcare environments. For instance, using TinyML for lesion segmentation could provide immediate diagnostic feedback during patient consultations or in remote locations, significantly reducing dependence on extensive infrastructure typically needed for detailed analyses.</p>
<p id="p-10">The incorporation of TinyML into medical devices is expected to enhance diagnostic accuracy, improve patient outcomes, and broaden access to advanced medical technologies in underserved regions. To optimize the deployment of TinyML in these critical applications, researchers are exploring advanced methods such as hyper-structure optimization [<xref ref-type="bibr" rid="B22">22</xref>] and leveraging efficient techniques like binary neural networks [<xref ref-type="bibr" rid="B23">23</xref>].</p>
<p id="p-11">Hyper-structure optimization focuses on reducing the model’s parameter count without sacrificing performance, ensuring the models remain both practical and lightweight for use on miniature devices. Moreover, implementing binary neural networks helps streamline computations, further enhancing the practicality of TinyML applications in resource-constrained settings. As we delve into optimizing and applying models like MUCM-Net in healthcare. This research not only underscores the transformative possibilities of TinyML but also guides future explorations in deploying compact, efficient AI solutions in medical settings.</p>
<p id="p-12">Supervised methods of segmentation: As AI technology continues to advance, the approaches for medical image segmentation have evolved significantly. Initially, the field heavily relied on CNNs such as U-Net, which is essential in medical image segmentation [<xref ref-type="bibr" rid="B24">24</xref>], and its attention-enhanced variant, Att-UNet [<xref ref-type="bibr" rid="B25">25</xref>], which incorporates attention mechanisms to further refine the segmentation accuracy by focusing on relevant features within the images. The development of hybrid architectures marks a further evolution in segmentation techniques. There are some hybrid-based UNets for medical image segmentation: (1) Transformers-related: such as TransUNet [<xref ref-type="bibr" rid="B26">26</xref>], TransFuse [<xref ref-type="bibr" rid="B27">27</xref>], and SANet [<xref ref-type="bibr" rid="B28">28</xref>]; (2) MLP-related: such as ConvNeXts [<xref ref-type="bibr" rid="B29">29</xref>], UNeXt [<xref ref-type="bibr" rid="B30">30</xref>], MALUNet [<xref ref-type="bibr" rid="B31">31</xref>] and its extended version EGE-UNet [<xref ref-type="bibr" rid="B32">32</xref>]. Recently, as Vision Mamba [<xref ref-type="bibr" rid="B33">33</xref>]’s image processing ability with fewer parameters and lower computations, Mamba-based hybrid structure UNets are becoming popular such as VM-UNet [<xref ref-type="bibr" rid="B34">34</xref>], VM-UNet V2 [<xref ref-type="bibr" rid="B35">35</xref>], LightM-UNet [<xref ref-type="bibr" rid="B36">36</xref>], and UltraLight VM-UNet [<xref ref-type="bibr" rid="B37">37</xref>].</p>
<p id="p-13">State-space models (SSMs): SSMs have recently been recognized for their linear complexity concerning input size and memory usage, establishing them as fundamental components for lightweight model architectures [<xref ref-type="bibr" rid="B38">38</xref>]. SSMs are particularly effective at capturing long-range dependencies, offering a critical solution to the convolution challenge of processing information across extensive distances. With the advantage of SSMs, Mamba [<xref ref-type="bibr" rid="B39">39</xref>] has been proven to handle textual data with fewer parameters than Transformers. Similarly, the advent of Vision Mamba has advanced the application of SSMs in image processing, demonstrating a significant memory reduction, all without relying on traditional attention mechanisms. This pioneering research bolsters confidence in Mamba’s potential as a critical lightweight model component in future technological advancements.</p>
<p id="p-14">In this paper, we extend our previous work UCM-Net to propose a new hybrid work MUCM-Net which engages the Mamba’s features learning ability and maintains fewer parameters and lower computations.</p>
</sec>
</sec>
<sec id="s2">
<title>Materials and methods</title>
<sec id="t2-1">
<title>MUCM-Net</title>
<p id="p-15">Network structure design: <xref ref-type="fig" rid="fig3">Figure 3</xref> presents a detailed overview of the structural framework of MUCM-Net, a cutting-edge architecture featuring a unique U-shape design, building upon UCM-Net. MUCM-Net consists of a down-sampling encoder and an up-sampling decoder, forming a robust network for skin lesion segmentation. The network is composed of six encoder-decoder stages, with channel capacities set at {8, 16, 24, 32, 48, 64}. The first stage in the encoder-decoder sequence is a convolutional block, responsible for extracting and capturing critical features. The subsequent stages incorporate our novel UCM-Net blocks, enhancing the network’s performance.</p>
<fig id="fig3" position="float">
<label>Figure 3</label>
<caption>
<p id="fig3-p-1">
<bold>MUCM-Net pipeline</bold>. Conv2D: 2-dimensional convolution</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="em-05-1001250-g003.tif" />
</fig>
<p id="p-16">Convolution block: In our design, the first encoder-decoder stage employs a standard convolution layer with a 3 × 3 filter. This convolution block utilizes a 3 × 3 kernel, which is widely used to capture spatial relationships within input features. This kernel size is especially beneficial in the initial layers of the network, where maintaining the spatial integrity of feature maps is crucial for decoding complex input patterns. From the 2nd to the 6th stage, we incorporate a 1 × 1 filter convolution layer, which supports the subsequent Mamba-UCM block. This adjustment significantly reduces the number of learnable parameters and the overall computational load, optimizing the network’s efficiency.</p>
<p id="p-17">Mamba-UCM block: The 2nd–6th stages mainly use the Mamba-UCM block for feature learning. The Mamba-UCM block showcases an advanced strategy that merges UCM-Net block, which contains CNNs with MLPs and Mamba block, to enhance feature learning. There are two advantages in the hybrid structure: (1) CNNs module can enable the model to extract the spatial feature; (2) MLPs and SSM can power the model’s pattern recognition capabilities. The process begins by reshaping the initial input feature map to meet the distinct requirements of CNNs, MLPs, and Mamba. This adaptation involves converting a four-dimensional tensor suitable for CNN processing into a three-dimensional tensor appropriate for MLP and Mamba operations. Inspired by UltraLight VM-UNet and Vision Mamba, we proposed four versions of MUCM-Net with different patch processing. <xref ref-type="fig" rid="fig4">Figure 4</xref> presents the visible differences between the UCM-Net block and the two visions of Mamba-UCM blocks. The PyTorch-style pseudocode in <xref ref-type="fig" rid="fig5">Figure 5</xref> presents our defined sequence of operations, which is how we combine the UCM block and the Mamba block for feature learning.</p>
<fig id="fig4" position="float">
<label>Figure 4</label>
<caption>
<p id="fig4-p-1">
<bold>MUCM-Net Structure</bold>. (<bold>A</bold>) UCM-Net pipeline; (<bold>B</bold>) MUCM-Net (1-patch) pipeline; (<bold>C</bold>) MUCM-Net (2-patch) pipeline. SSM: state-space model; Norm: normalization; Conv2D: 2-dimensional convolution</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="em-05-1001250-g004.tif" />
</fig>
<fig id="fig5" position="float">
<label>Figure 5</label>
<caption>
<p id="fig5-p-1">
<bold>Mamba-UCM block pseudocode</bold>
</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="em-05-1001250-g005.tif" />
</fig>
</sec>
<sec id="t2-2">
<title>Loss functions</title>
<p id="p-18">In our solution, we designed a new group loss function similar to those used in TransFuse, EGE-UNet, and our previous work, UCM-Net. However, different from theirs, our proposed base loss function is calculated from Binary Cross-Entropy (BCE) loss (1) and Dice loss (2) components and square Dice loss (3) components to calculate the loss from the scaled layer masks in different stages compared with the ground truth masks.</p>
<p id="p-19">The advantages of using different loss functions are as follows:</p>
<p id="p-20">
<list list-type="simple">
<list-item>
<label>1.</label>
<p>BCE loss: Widely used in classification tasks, including biomedical image segmentation, these losses are highly effective for pixel-level segmentation.</p>
</list-item>
<list-item>
<label>2.</label>
<p>Dice loss: Commonly used in biomedical image segmentation, Dice loss addresses class imbalance by focusing on the overlap between predicted and true regions.</p>
</list-item>
<list-item>
<label>3.</label>
<p>Square Dice loss: Further enhances the Dice loss by emphasizing the contribution of well-predicted regions, thereby improving stability and performance.</p>
</list-item>
</list>
</p>
<disp-formula id="eq1"><label>(1)</label><mml:math id="m1" display="block">  <mml:mi>B</mml:mi>  <mml:mi>C</mml:mi>  <mml:mi>E</mml:mi>  <mml:mo>=</mml:mo>  <mml:mo>&#x2013;</mml:mo>  <mml:mfrac>    <mml:mn>1</mml:mn>    <mml:mi>N</mml:mi>  </mml:mfrac>  <mml:munderover>    <mml:mo>&#x2211;</mml:mo>    <mml:mrow>      <mml:mi>i</mml:mi>      <mml:mo>=</mml:mo>      <mml:mn>1</mml:mn>    </mml:mrow>    <mml:mrow>      <mml:mi>N</mml:mi>    </mml:mrow>  </mml:munderover>  <mml:mo stretchy="false">[</mml:mo>  <mml:msub>    <mml:mi>y</mml:mi>    <mml:mrow>      <mml:mi>i</mml:mi>    </mml:mrow>  </mml:msub>  <mml:mi>l</mml:mi>  <mml:mi>o</mml:mi>  <mml:mi>g</mml:mi>  <mml:mo stretchy="false">(</mml:mo>  <mml:msub>    <mml:mi>p</mml:mi>    <mml:mrow>      <mml:mi>i</mml:mi>    </mml:mrow>  </mml:msub>  <mml:mo stretchy="false">)</mml:mo>  <mml:mo>+</mml:mo>  <mml:mo stretchy="false">(</mml:mo>  <mml:mn>1</mml:mn>  <mml:mo>&#x2212;</mml:mo>  <mml:msub>    <mml:mi>y</mml:mi>    <mml:mrow>      <mml:mi>i</mml:mi>    </mml:mrow>  </mml:msub>  <mml:mo stretchy="false">)</mml:mo>  <mml:mi>l</mml:mi>  <mml:mi>o</mml:mi>  <mml:mi>g</mml:mi>  <mml:mo stretchy="false">(</mml:mo>  <mml:mn>1</mml:mn>  <mml:mo>&#x2212;</mml:mo>  <mml:msub>    <mml:mi>p</mml:mi>    <mml:mrow>      <mml:mi>i</mml:mi>    </mml:mrow>  </mml:msub>  <mml:mo stretchy="false">)</mml:mo>  <mml:mo stretchy="false">]</mml:mo></mml:math></disp-formula>
<p id="p-21">where <italic>N</italic> is the total number of pixels (for image segmentation) or elements (for other tasks), <italic>y<sub>i</sub></italic> is the ground truth value, and <italic>p<sub>i</sub></italic> is the predicted probability for the i-th element.</p>
<disp-formula id="eq2"><label>(2)</label><mml:math id="m2" display="block">  <mml:mtext>&#xA0;Dice Loss&#xA0;</mml:mtext>  <mml:mo>=</mml:mo>  <mml:mn>1</mml:mn>  <mml:mo>&#x2212;</mml:mo>  <mml:mfrac>    <mml:mrow>      <mml:mn>2</mml:mn>      <mml:mo>&#xD7;</mml:mo>      <mml:mrow>        <mml:mstyle displaystyle="false" scriptlevel="0">          <mml:munderover>            <mml:mo>&#x2211;</mml:mo>            <mml:mrow>              <mml:mi>i</mml:mi>              <mml:mo>=</mml:mo>              <mml:mn>1</mml:mn>            </mml:mrow>            <mml:mrow>              <mml:mi>N</mml:mi>            </mml:mrow>          </mml:munderover>        </mml:mstyle>      </mml:mrow>      <mml:mo stretchy="false">(</mml:mo>      <mml:msub>        <mml:mi>p</mml:mi>        <mml:mrow>          <mml:mi>i</mml:mi>        </mml:mrow>      </mml:msub>      <mml:mo>&#x22C5;</mml:mo>      <mml:msub>        <mml:mi>y</mml:mi>        <mml:mrow>          <mml:mi>i</mml:mi>        </mml:mrow>      </mml:msub>      <mml:mo stretchy="false">)</mml:mo>      <mml:mo>+</mml:mo>      <mml:mtext>smooth</mml:mtext>    </mml:mrow>    <mml:mrow>      <mml:mstyle displaystyle="false" scriptlevel="0">        <mml:munderover>          <mml:mo>&#x2211;</mml:mo>          <mml:mrow>            <mml:mi>i</mml:mi>            <mml:mo>=</mml:mo>            <mml:mn>1</mml:mn>          </mml:mrow>          <mml:mrow>            <mml:mi>N</mml:mi>          </mml:mrow>        </mml:munderover>        <mml:msub>          <mml:mi>p</mml:mi>          <mml:mrow>            <mml:mi>i</mml:mi>          </mml:mrow>        </mml:msub>        <mml:mo>+</mml:mo>        <mml:mrow>          <mml:mstyle displaystyle="false" scriptlevel="0">            <mml:munderover>              <mml:mo>&#x2211;</mml:mo>              <mml:mrow>                <mml:mi>i</mml:mi>                <mml:mo>=</mml:mo>                <mml:mn>1</mml:mn>              </mml:mrow>              <mml:mrow>                <mml:mi>N</mml:mi>              </mml:mrow>            </mml:munderover>            <mml:msub>              <mml:mi>y</mml:mi>              <mml:mrow>                <mml:mi>i</mml:mi>              </mml:mrow>            </mml:msub>            <mml:mo>+</mml:mo>            <mml:mtext>smooth</mml:mtext>          </mml:mstyle>        </mml:mrow>      </mml:mstyle>    </mml:mrow>  </mml:mfrac></mml:math></disp-formula>
<p id="p-22">where we used a smooth constant, which equals 1e-5, to enhance numerical stability.</p>
<disp-formula id="eq3"><label>(3)</label><mml:math id="m3" display="block">  <mml:mtext>&#xA0;Square Dice Loss&#xA0;</mml:mtext>  <mml:mo>=</mml:mo>  <mml:mn>1</mml:mn>  <mml:mo>&#x2212;</mml:mo>  <mml:mfrac>    <mml:mrow>      <mml:mn>2</mml:mn>      <mml:mo>&#xD7;</mml:mo>      <mml:mo stretchy="false">(</mml:mo>      <mml:mrow>        <mml:mstyle displaystyle="false" scriptlevel="0">          <mml:munderover>            <mml:mo>&#x2211;</mml:mo>            <mml:mrow>              <mml:mi>i</mml:mi>              <mml:mo>=</mml:mo>              <mml:mn>1</mml:mn>            </mml:mrow>            <mml:mrow>              <mml:mi>N</mml:mi>            </mml:mrow>          </mml:munderover>          <mml:mo stretchy="false">(</mml:mo>          <mml:msub>            <mml:mi>p</mml:mi>            <mml:mrow>              <mml:mi>i</mml:mi>            </mml:mrow>          </mml:msub>          <mml:mo>&#x22C5;</mml:mo>          <mml:msub>            <mml:mi>y</mml:mi>            <mml:mrow>              <mml:mi>i</mml:mi>            </mml:mrow>          </mml:msub>          <mml:mo stretchy="false">)</mml:mo>          <mml:msup>            <mml:mo stretchy="false">)</mml:mo>            <mml:mrow>              <mml:mn>2</mml:mn>            </mml:mrow>          </mml:msup>          <mml:mo>+</mml:mo>          <mml:mtext>smooth</mml:mtext>        </mml:mstyle>      </mml:mrow>    </mml:mrow>    <mml:mrow>      <mml:mo stretchy="false">(</mml:mo>      <mml:mrow>        <mml:mstyle displaystyle="false" scriptlevel="0">          <mml:munderover>            <mml:mo>&#x2211;</mml:mo>            <mml:mrow>              <mml:mi>i</mml:mi>              <mml:mo>=</mml:mo>              <mml:mn>1</mml:mn>            </mml:mrow>            <mml:mrow>              <mml:mi>N</mml:mi>            </mml:mrow>          </mml:munderover>          <mml:msub>            <mml:mi>p</mml:mi>            <mml:mrow>              <mml:mi>i</mml:mi>            </mml:mrow>          </mml:msub>          <mml:msup>            <mml:mo stretchy="false">)</mml:mo>            <mml:mrow>              <mml:mn>2</mml:mn>            </mml:mrow>          </mml:msup>          <mml:mo>+</mml:mo>          <mml:mo stretchy="false">(</mml:mo>          <mml:mrow>            <mml:mstyle displaystyle="false" scriptlevel="0">              <mml:munderover>                <mml:mo>&#x2211;</mml:mo>                <mml:mrow>                  <mml:mi>i</mml:mi>                  <mml:mo>=</mml:mo>                  <mml:mn>1</mml:mn>                </mml:mrow>                <mml:mrow>                  <mml:mi>N</mml:mi>                </mml:mrow>              </mml:munderover>              <mml:msub>                <mml:mi>y</mml:mi>                <mml:mrow>                  <mml:mi>i</mml:mi>                </mml:mrow>              </mml:msub>              <mml:msup>                <mml:mo stretchy="false">)</mml:mo>                <mml:mrow>                  <mml:mn>2</mml:mn>                </mml:mrow>              </mml:msup>              <mml:mo>+</mml:mo>              <mml:mtext>smooth</mml:mtext>            </mml:mstyle>          </mml:mrow>        </mml:mstyle>      </mml:mrow>    </mml:mrow>  </mml:mfrac></mml:math></disp-formula>
<p id="p-23">where the equation represents an improvement over the standard Dice loss by placing greater emphasis on the squared terms of intersections and unions.</p>
<disp-formula id="eq4"><label>(4)</label><mml:math id="m4" display="block"><mml:mtext>Base</mml:mtext><mml:mtext>_</mml:mtext><mml:mtext>loss</mml:mtext><mml:mo>=</mml:mo><mml:mtext>BCE</mml:mtext><mml:mo>+</mml:mo><mml:mtext>Dice Loss</mml:mtext><mml:mo>+</mml:mo><mml:mtext>Square Dice Loss</mml:mtext></mml:math></disp-formula>
<p id="p-24">
<xref ref-type="disp-formula" rid="eq1">Equations 1</xref>, <xref ref-type="disp-formula" rid="eq2">2</xref>, and <xref ref-type="disp-formula" rid="eq3">3</xref> define the base loss function (<xref ref-type="disp-formula" rid="eq4">Equation 4</xref>) for our proposed model, incorporating the Dice loss, and square Dice loss components. <italic>λ<sub>i</sub></italic> represents the weight assigned to different stages. We explore adding the difference between the up-sample from the stage with ground truth to the final loss. Because the large stage’s result should be close to the final prediction, we set <italic>λ<sub>i</sub></italic> to 0.1, 0.2, 0.3, 0.4, and 0.5 based on the i-th stage, as illustrated in <xref ref-type="fig" rid="fig3">Figure 3</xref>.</p>
<p id="p-25">
<xref ref-type="disp-formula" rid="eq7">Equation 7</xref> defines our proposed group loss function, which calculates the loss based on the scaled layer masks at various stages compared to the ground truth masks. <xref ref-type="disp-formula" rid="eq5">Equations 5</xref> and <xref ref-type="disp-formula" rid="eq6">6</xref> detail the stage loss for different intermediate layers and the output loss for the final layer, respectively.</p>
<disp-formula id="eq5"><label>(5)</label><mml:math id="m5" display="block">  <mml:mi>L</mml:mi>  <mml:mi>o</mml:mi>  <mml:mi>s</mml:mi>  <mml:msub>    <mml:mi>s</mml:mi>    <mml:mrow>      <mml:mi>S</mml:mi>      <mml:mi>t</mml:mi>      <mml:mi>a</mml:mi>      <mml:mi>g</mml:mi>      <mml:mi>e</mml:mi>    </mml:mrow>  </mml:msub>  <mml:mo>=</mml:mo>  <mml:mtext>Base_loss</mml:mtext>  <mml:mo stretchy="false">(</mml:mo>  <mml:mi>S</mml:mi>  <mml:mi>t</mml:mi>  <mml:mi>a</mml:mi>  <mml:mi>g</mml:mi>  <mml:mi>e</mml:mi>  <mml:mi>P</mml:mi>  <mml:mi>r</mml:mi>  <mml:mi>e</mml:mi>  <mml:mi>d</mml:mi>  <mml:mo>,</mml:mo>  <mml:mi>T</mml:mi>  <mml:mi>a</mml:mi>  <mml:mi>r</mml:mi>  <mml:mi>g</mml:mi>  <mml:mi>e</mml:mi>  <mml:mi>t</mml:mi>  <mml:mo stretchy="false">)</mml:mo></mml:math></disp-formula>
<disp-formula id="eq6"><label>(6)</label><mml:math id="m6" display="block">  <mml:mi>L</mml:mi>  <mml:mi>o</mml:mi>  <mml:mi>s</mml:mi>  <mml:msub>    <mml:mi>s</mml:mi>    <mml:mrow>      <mml:mi>O</mml:mi>      <mml:mi>u</mml:mi>      <mml:mi>t</mml:mi>      <mml:mi>p</mml:mi>      <mml:mi>u</mml:mi>      <mml:mi>t</mml:mi>    </mml:mrow>  </mml:msub>  <mml:mo>=</mml:mo>  <mml:mtext>Base_loss</mml:mtext>  <mml:mo stretchy="false">(</mml:mo>  <mml:mi>O</mml:mi>  <mml:mi>u</mml:mi>  <mml:mi>t</mml:mi>  <mml:mi>p</mml:mi>  <mml:mi>u</mml:mi>  <mml:mi>t</mml:mi>  <mml:mi>P</mml:mi>  <mml:mi>r</mml:mi>  <mml:mi>e</mml:mi>  <mml:mi>d</mml:mi>  <mml:mo>,</mml:mo>  <mml:mi>T</mml:mi>  <mml:mi>a</mml:mi>  <mml:mi>r</mml:mi>  <mml:mi>g</mml:mi>  <mml:mi>e</mml:mi>  <mml:mi>t</mml:mi>  <mml:mo stretchy="false">)</mml:mo></mml:math></disp-formula>
<disp-formula id="eq7"><label>(7)</label><mml:math id="m7" display="block">  <mml:mi>G</mml:mi>  <mml:mi>r</mml:mi>  <mml:mi>o</mml:mi>  <mml:mi>u</mml:mi>  <mml:mi>p</mml:mi><mml:mo>_</mml:mo><mml:mi>L</mml:mi>  <mml:mi>o</mml:mi>  <mml:mi>s</mml:mi>  <mml:mi>s</mml:mi>  <mml:mo>=</mml:mo>  <mml:mi>L</mml:mi>  <mml:mi>o</mml:mi>  <mml:mi>s</mml:mi>  <mml:msub>    <mml:mi>s</mml:mi>    <mml:mrow>      <mml:mi>O</mml:mi>      <mml:mi>u</mml:mi>      <mml:mi>t</mml:mi>      <mml:mi>p</mml:mi>      <mml:mi>u</mml:mi>      <mml:mi>t</mml:mi>    </mml:mrow>  </mml:msub>  <mml:mo>+</mml:mo>  <mml:munderover>    <mml:mo>&#x2211;</mml:mo>    <mml:mrow>      <mml:mi>i</mml:mi>      <mml:mo>=</mml:mo>      <mml:mn>1</mml:mn>    </mml:mrow>    <mml:mrow>      <mml:mi>5</mml:mi>    </mml:mrow>  </mml:munderover>  <mml:msub>    <mml:mi>&#x3BB;</mml:mi>    <mml:mrow>      <mml:mi>i</mml:mi>    </mml:mrow>  </mml:msub>  <mml:mo>&#xD7;</mml:mo>  <mml:mi>L</mml:mi>  <mml:mi>o</mml:mi>  <mml:mi>s</mml:mi>  <mml:msub>    <mml:mi>s</mml:mi>    <mml:mrow>      <mml:mi>S</mml:mi>      <mml:mi>t</mml:mi>      <mml:mi>a</mml:mi>      <mml:mi>g</mml:mi>      <mml:msub>        <mml:mi>e</mml:mi>        <mml:mrow>          <mml:mi>i</mml:mi>        </mml:mrow>      </mml:msub>    </mml:mrow>  </mml:msub></mml:math></disp-formula>
<p id="p-26">To prove the effectiveness of our proposed methods, we did an ablation experiment of various base loss functions and the experimental results are reported in the following <xref ref-type="sec" rid="s4">Discussion</xref> section.</p>
</sec>
</sec>
<sec id="s3">
<title>Results</title>
<p id="p-27">Datasets: To evaluate the efficiency and performance of our proposed model with other published models, we picked the two public skin segmentation datasets from the ISIC, namely ISIC2017 and ISIC2018. The ISIC2017 dataset contains 2,000 dermoscopy images, while the ISIC2018 dataset includes 2,594 images. The ISIC2017 dataset was randomly divided into 1,250 for training, 150 for validation, and 600 for testing. The ISIC2018 dataset was randomly divided into 1,815 for training, 259 for validation, and 520 for testing.</p>
<p id="p-28">Evaluation setting: Our MUCM-Net is implemented with the PyTorch [<xref ref-type="bibr" rid="B40">40</xref>] framework. All experiments are conducted on the instance node at Lambda [<xref ref-type="bibr" rid="B41">41</xref>] that has a single NVIDIA RTX A6000 GPU (24 GB), 14vCPUs, 46 GiB RAM, and 512 GiB SSD. We normalized and resized the images to 256 × 256 pixels. To enhance data sample diversity, we applied basic data augmentations, including horizontal and vertical flipping, as well as random rotation. This is because, although there are various and effective image augmentation techniques in the current literature [<xref ref-type="bibr" rid="B42">42</xref>], they may lead to an increase in the computational cost. We selected AdamW [<xref ref-type="bibr" rid="B43">43</xref>] for the optimizer, initialized with a learning rate of 0.001 and a weight decay of 0.01. The CosineAnnealingLR scheduler [<xref ref-type="bibr" rid="B44">44</xref>] is used with a maximum number of iterations set to 50 and a minimum learning rate of 1e-5. The model is trained for a total of 200 epochs with a training batch size of 8 and a testing batch size of 1.</p>
<p id="p-29">Evaluation metrics: The model’s performance is evaluated using the Dice Similarity Coefficient (DSC), sensitivity (SE), specificity (SP), and accuracy (ACC). Furthermore, the model’s memory consumption is assessed based on the number of parameters and GFLOPS. DSC measures the degree of similarity between the ground truth and the predicted segmentation map. SE is used to measure the percentage of true positives in relation to the sum of true positives and false negatives. SP measures the percentage of true negatives in relation to the sum of true negatives and false positives. ACC measures the overall percentage of correct classifications. The formulas used are as follows:</p>
<disp-formula id="eq8"><label>(8)</label><mml:math id="m8" display="block"><mml:mtext>DSC</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>2</mml:mn><mml:mo>×</mml:mo><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:mo>×</mml:mo><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:math></disp-formula>
<disp-formula id="eq9"><label>(9)</label><mml:math id="m9" display="block"><mml:mtext>ACC</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mi> </mml:mi><mml:mo>+</mml:mo><mml:mi> </mml:mi><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mi> </mml:mi><mml:mo>+</mml:mo><mml:mi> </mml:mi><mml:mi>T</mml:mi><mml:mi>N</mml:mi><mml:mi> </mml:mi><mml:mo>+</mml:mo><mml:mi> </mml:mi><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mi> </mml:mi><mml:mo>+</mml:mo><mml:mi> </mml:mi><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:math></disp-formula>
<disp-formula id="eq10"><label>(10)</label><mml:math id="m10" display="block"><mml:mtext>S</mml:mtext><mml:mtext>E</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:math></disp-formula>
<disp-formula id="eq11"><label>(11)</label><mml:math id="m11" display="block"><mml:mtext>SP</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>N</mml:mi><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:math></disp-formula>
<p id="p-30">where TP denotes true positive, TN denotes true negative, FP denotes false positive, and FN denotes false negative. In our benchmark tests, we evaluate the effectiveness of our approach and contrast it with other existing high-performing models.</p>
<p id="p-31">Experiments results: <xref ref-type="table" rid="t1">Tables 1</xref> and <xref ref-type="table" rid="t2">2</xref> present the segmentation prediction performance, while <xref ref-type="table" rid="t3">Table 3</xref> provides an overview of the models’ physical performance.</p>
<table-wrap id="t1">
<label>Table 1</label>
<caption>
<p id="t1-p-1">
<bold>Comparative prediction results on the ISIC2017 dataset</bold>
</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>
<bold>Dataset</bold>
</th>
<th>
<bold>Models</bold>
</th>
<th>
<bold>Year</bold>
</th>
<th>
<bold>DSC↑</bold>
</th>
<th>
<bold>SE↑</bold>
</th>
<th>
<bold>SP↑</bold>
</th>
<th>
<bold>ACC↑</bold>
</th>
</tr>
</thead>
<tbody>
<tr>
<td rowspan="17">ISIC2017</td>
<td>U-Net<sup>*</sup></td>
<td>2015</td>
<td>0.8989</td>
<td>0.8793</td>
<td>0.9812</td>
<td>0.9613</td>
</tr>
<tr>
<td>SCR-Net<sup>*</sup></td>
<td>2021</td>
<td>0.8898</td>
<td>0.8497</td>
<td>0.9853</td>
<td>0.9588</td>
</tr>
<tr>
<td>C<sup>2</sup>SDG<sup>*</sup></td>
<td>2021</td>
<td>0.8938</td>
<td>0.8859</td>
<td>0.9765</td>
<td>0.9588</td>
</tr>
<tr>
<td>ATTENTION SWIN U-NET<sup>*</sup></td>
<td>2022</td>
<td>0.8859</td>
<td>0.8492</td>
<td>0.9847</td>
<td>0.9591</td>
</tr>
<tr>
<td>MALUNet<sup>*</sup></td>
<td>2022</td>
<td>0.8896</td>
<td>0.8824</td>
<td>0.9762</td>
<td>0.9583</td>
</tr>
<tr>
<td>UNeXt-S<sup>#</sup></td>
<td>2022</td>
<td>0.9017</td>
<td>0.8894</td>
<td>0.9806</td>
<td>0.9633</td>
</tr>
<tr>
<td>EGE-UNet<sup>*</sup></td>
<td>2023</td>
<td>0.9073</td>
<td>0.8931</td>
<td>0.9816</td>
<td>0.9642</td>
</tr>
<tr>
<td>VM-UNet<sup>*</sup></td>
<td>2024</td>
<td>0.9070</td>
<td>0.8837</td>
<td>0.9842</td>
<td>0.9645</td>
</tr>
<tr>
<td>VM-UNet v2<sup>*</sup></td>
<td>2024</td>
<td>0.9045</td>
<td>0.8768</td>
<td>0.9849</td>
<td>0.9637</td>
</tr>
<tr>
<td>LightM-UNet<sup>*</sup></td>
<td>2024</td>
<td>0.9080</td>
<td>0.8839</td>
<td>0.9846</td>
<td>0.9649</td>
</tr>
<tr>
<td>UltraLight VM-UNet<sup>*</sup></td>
<td>2024</td>
<td>0.9091</td>
<td>0.9053</td>
<td>0.9790</td>
<td>0.9646</td>
</tr>
<tr>
<td>UltraLight VM-UNet<sup>#</sup></td>
<td>2024</td>
<td>0.9097</td>
<td>0.9042</td>
<td>0.9804</td>
<td>0.9660</td>
</tr>
<tr>
<td>UCM-Net (Baseline)</td>
<td>2024</td>
<td>0.9120</td>
<td>0.8824</td>
<td>0.9877</td>
<td>0.9678</td>
</tr>
<tr>
<td>MUCM-Net (1-patch)</td>
<td>2024</td>
<td>0.9160</td>
<td>0.9090</td>
<td>0.9869</td>
<td>0.9689</td>
</tr>
<tr>
<td>MUCM-Net (2-patch)</td>
<td>2024</td>
<td>0.9126</td>
<td>0.9008</td>
<td>0.9829</td>
<td>0.9679</td>
</tr>
<tr>
<td>MUCM-Net (4-patch)</td>
<td>2024</td>
<td>0.9133</td>
<td>0.8871</td>
<td>0.9870</td>
<td>0.9681</td>
</tr>
<tr>
<td>MUCM-Net (8-patch)</td>
<td>2024</td>
<td>0.9185</td>
<td>0.9014</td>
<td>0.9857</td>
<td>0.9697</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p id="t1-fn-1">
<sup>*</sup> the results cited from UltraLight VM-Net; <sup>#</sup> the results tested by us. ISIC: International Skin Imaging Collaboration; DSC: Dice Similarity Coefficient; SE: sensitivity; SP: specificity; ACC: accuracy. ↑: the higher the value, the better the performance</p>
</fn>
</table-wrap-foot>
</table-wrap>
<table-wrap id="t2">
<label>Table 2</label>
<caption>
<p id="t2-p-1">
<bold>Comparative prediction results on the ISIC2018</bold>
</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>
<bold>Dataset</bold>
</th>
<th>
<bold>Models</bold>
</th>
<th>
<bold>Year</bold>
</th>
<th>
<bold>DSC↑</bold>
</th>
<th>
<bold>SE↑</bold>
</th>
<th>
<bold>SP↑</bold>
</th>
<th>
<bold>ACC↑</bold>
</th>
</tr>
</thead>
<tbody>
<tr>
<td rowspan="17">ISIC2018</td>
<td>U-Net<sup>*</sup></td>
<td>2015</td>
<td>0.8851</td>
<td>0.8735</td>
<td>0.9744</td>
<td>0.9539</td>
</tr>
<tr>
<td>SCR-Net<sup>*</sup></td>
<td>2021</td>
<td>0.8886</td>
<td>0.8892</td>
<td>0.9714</td>
<td>0.9547</td>
</tr>
<tr>
<td>C<sup>2</sup>SDG<sup>*</sup></td>
<td>2021</td>
<td>0.8806</td>
<td>0.8970</td>
<td>0.9643</td>
<td>0.9506</td>
</tr>
<tr>
<td>ATTENTION SWIN U-NET<sup>*</sup></td>
<td>2022</td>
<td>0.8540</td>
<td>0.8057</td>
<td>0.9826</td>
<td>0.9480</td>
</tr>
<tr>
<td>MALUNet<sup>*</sup></td>
<td>2022</td>
<td>0.8931</td>
<td>0.8890</td>
<td>0.9725</td>
<td>0.9548</td>
</tr>
<tr>
<td>UNeXt-S<sup>#</sup></td>
<td>2022</td>
<td>0.8910</td>
<td>0.8577</td>
<td>0.9818</td>
<td>0.9555</td>
</tr>
<tr>
<td>EGE-UNet<sup>*</sup></td>
<td>2023</td>
<td>0.8819</td>
<td>0.9009</td>
<td>0.9638</td>
<td>0.9510</td>
</tr>
<tr>
<td>VM-UNet<sup>*</sup></td>
<td>2024</td>
<td>0.8891</td>
<td>0.8809</td>
<td>0.9743</td>
<td>0.9554</td>
</tr>
<tr>
<td>VM-UNet v2<sup>*</sup></td>
<td>2024</td>
<td>0.8902</td>
<td>0.8959</td>
<td>0.9702</td>
<td>0.9551</td>
</tr>
<tr>
<td>LightM-UNet<sup>*</sup></td>
<td>2024</td>
<td>0.8898</td>
<td>0.8829</td>
<td>0.9765</td>
<td>0.9555</td>
</tr>
<tr>
<td>UltraLight VM-UNet<sup>*</sup></td>
<td>2024</td>
<td>0.8940</td>
<td>0.8680</td>
<td>0.9781</td>
<td>0.9558</td>
</tr>
<tr>
<td>UltraLight VM-UNet<sup>#</sup></td>
<td>2024</td>
<td>0.8905</td>
<td>0.8724</td>
<td>0.9766</td>
<td>0.9545</td>
</tr>
<tr>
<td>UCM-Net (Baseline)</td>
<td>2024</td>
<td>0.9060</td>
<td>0.9041</td>
<td>0.9753</td>
<td>0.9602</td>
</tr>
<tr>
<td>MUCM-Net (1-patch)</td>
<td>2024</td>
<td>0.9111</td>
<td>0.8953</td>
<td>0.9811</td>
<td>0.9629</td>
</tr>
<tr>
<td>MUCM-Net (2-patch)</td>
<td>2024</td>
<td>0.9040</td>
<td>0.9151</td>
<td>0.9706</td>
<td>0.9588</td>
</tr>
<tr>
<td>MUCM-Net (4-patch)</td>
<td>2024</td>
<td>0.9058</td>
<td>0.8752</td>
<td>0.9846</td>
<td>0.9614</td>
</tr>
<tr>
<td>MUCM-Net (8-patch)</td>
<td>2024</td>
<td>0.9095</td>
<td>0.9046</td>
<td>0.9772</td>
<td>0.9618</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p id="t2-fn-1">
<sup>*</sup> the results cited from UltraLight VM-Net; <sup>#</sup> the results tested by us. ISIC: International Skin Imaging Collaboration; DSC: Dice Similarity Coefficient; SE: sensitivity; SP: specificity; ACC: accuracy. ↑: the higher the value, the better the performance</p>
</fn>
</table-wrap-foot>
</table-wrap>
<table-wrap id="t3">
<label>Table 3</label>
<caption>
<p id="t3-p-1">
<bold>Comparative performance results on models’ computations and the number of parameters</bold>
</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>
<bold>Models</bold>
</th>
<th>
<bold>Year</bold>
</th>
<th>
<bold>Params (millions)↓</bold>
</th>
<th>
<bold>GFLOPS↓</bold>
</th>
</tr>
</thead>
<tbody>
<tr>
<td>U-Net</td>
<td>2015</td>
<td>2.009</td>
<td>3.224</td>
</tr>
<tr>
<td>SCR-Net</td>
<td>2021</td>
<td>0.801</td>
<td>1.567</td>
</tr>
<tr>
<td>C<sup>2</sup>SDG</td>
<td>2021</td>
<td>22.001</td>
<td>7.972</td>
</tr>
<tr>
<td>ATTENTION SWIN U-NET</td>
<td>2022</td>
<td>46.91</td>
<td>14.181</td>
</tr>
<tr>
<td>MALUNet</td>
<td>2022</td>
<td>0.175</td>
<td>0.083</td>
</tr>
<tr>
<td>UNeXt-S</td>
<td>2022</td>
<td>0.253</td>
<td>0.104</td>
</tr>
<tr>
<td>EGE-UNet</td>
<td>2023</td>
<td>0.053</td>
<td>0.072</td>
</tr>
<tr>
<td>VM-UNet</td>
<td>2024</td>
<td>27.427</td>
<td>4.112</td>
</tr>
<tr>
<td>VM-UNet v2</td>
<td>2024</td>
<td>22.771</td>
<td>4.400</td>
</tr>
<tr>
<td>LightM-UNet</td>
<td>2024</td>
<td>0.403</td>
<td>0.391</td>
</tr>
<tr>
<td>UltraLight VM-UNet</td>
<td>2024</td>
<td>0.049</td>
<td>0.065</td>
</tr>
<tr>
<td>UCM-Net (Baseline)</td>
<td>2024</td>
<td>0.047</td>
<td>0.045</td>
</tr>
<tr>
<td>MUCM-Net (1-patch)</td>
<td>2024</td>
<td>0.139</td>
<td>0.064</td>
</tr>
<tr>
<td>MUCM-Net (2-patch)</td>
<td>2024</td>
<td>0.100</td>
<td>0.059</td>
</tr>
<tr>
<td>MUCM-Net (4-patch)</td>
<td>2024</td>
<td>0.081</td>
<td>0.057</td>
</tr>
<tr>
<td>MUCM-Net (8-patch)</td>
<td>2024</td>
<td>0.071</td>
<td>0.055</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p id="t3-fn-1">GFLOPS: Giga Floating-point Operations Per Second. ↓: the lower the value, the better the performance</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s4">
<title>Discussion</title>
<sec id="t4-1">
<title>Experimental result analysis</title>
<p id="p-32">
<xref ref-type="table" rid="t1">Tables 1</xref> and <xref ref-type="table" rid="t2">2</xref> provide a thorough evaluation of the prediction performance of MUCM-Net, our novel Mamba-based skin lesion segmentation model, in comparison to established models. This assessment is conducted using the widely recognized ISIC2017 and ISIC2018 datasets. Introduced in 2024, MUCM-Net proves to be a robust and highly competitive solution in this domain. The key takeaway from these Tables is MUCM-Net’s ability to outperform all previous models, establishing a new state-of-the-art for lightweight skin lesion segmentation. Our model presents exceptional performance across various prediction metrics, underscoring its advancement in the field and potential to redefine the standard for accurate skin lesion delineation. To assess the physical performance of our proposed model, we compared its computational aspects and number of parameters with those of different segmentation models, as shown in <xref ref-type="table" rid="t3">Table 3</xref>. Remarkably, MUCM-Net (8-patch) operates with lower GFLOPS compared to other Mamba-based models. This efficiency does not come at the cost of performance, as MUCM-Net maintains high accuracy and robustness in segmentation tasks with the Mamba structure.</p>
</sec>
<sec id="t4-2">
<title>Ablation experiment on loss functions</title>
<p id="p-33">To prove the effects of our proposed loss function, we conducted an ablation experiment using different base loss functions to train our model, MUCM-Net (1-patch). <xref ref-type="table" rid="t4">Table 4</xref> presents the experimental results on the ISIC2017 dataset, providing a comparative analysis of the performance metrics for each loss function. The base loss functions evaluated include BCE loss (A), Dice loss (B), and square Dice loss (C). Additionally, combinations of these loss functions were tested: A + B, A + C, B + C, and A + B + C. The performance metrics considered were the DSC, SE, SP, and ACC. The training settings and hardware environment are the same as the benchmarks in <xref ref-type="table" rid="t1">Tables 1</xref> and <xref ref-type="table" rid="t2">2</xref>.</p>
<table-wrap id="t4">
<label>Table 4</label>
<caption>
<p id="t4-p-1">
<bold>Ablation experiments on loss functions</bold>
</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>
<bold>Dataset</bold>
</th>
<th>
<bold>Base loss function</bold>
</th>
<th>
<bold>DSC↑</bold>
</th>
<th>
<bold>SE↑</bold>
</th>
<th>
<bold>SP↑</bold>
</th>
<th>
<bold>ACC↑</bold>
</th>
</tr>
</thead>
<tbody>
<tr>
<td rowspan="7">ISIC2017</td>
<td>BCE loss (A)</td>
<td>0.9130</td>
<td>0.8878</td>
<td>0.9867</td>
<td>0.9680</td>
</tr>
<tr>
<td>Dice loss (B)</td>
<td>0.9152</td>
<td>0.9008</td>
<td>0.9814</td>
<td>0.9681</td>
</tr>
<tr>
<td>Square Dice loss (C)</td>
<td>0.9155</td>
<td>0.9051</td>
<td>0.9831</td>
<td>0.9684</td>
</tr>
<tr>
<td>A + B</td>
<td>0.9147</td>
<td>0.9078</td>
<td>0.9820</td>
<td>0.9680</td>
</tr>
<tr>
<td>A + C</td>
<td>0.9158</td>
<td>0.9010</td>
<td>0.9858</td>
<td>0.9677</td>
</tr>
<tr>
<td>B + C</td>
<td>0.9101</td>
<td>0.8854</td>
<td>0.9859</td>
<td>0.9669</td>
</tr>
<tr>
<td>A + B + C (our proposed)</td>
<td>0.9160</td>
<td>0.9089</td>
<td>0.9868</td>
<td>0.9690</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p id="t4-fn-1">ISIC: International Skin Imaging Collaboration; BCE: Binary Cross-Entropy; DSC: Dice Similarity Coefficient; SE: sensitivity; SP: specificity; ACC: accuracy. ↑: the higher the value, the better the performance</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p id="p-34">
<xref ref-type="table" rid="t4">Table 4</xref> reveals that individual loss functions and their combinations exhibit varying performance on the ISIC2017 dataset. Among the individual loss functions, BCE loss (A) demonstrates a solid overall performance with a high SP of 0.9867 and ACC of 0.9680. However, its SE is relatively lower at 0.8878. Dice loss (B) improves SE to 0.9008 and maintains high ACC (0.9681), while square Dice loss (C) further enhances SE to 0.9051 and retains high SP (0.9831) and ACC (0.9684). Combinations of these loss functions generally yield better results, with A + B and A + C showing improvements in DSC and SE. The proposed combination of A + B + C achieves the best overall performance, with the highest DSC (0.9160), SE (0.9089), SP (0.9868), and ACC (0.9690). This indicates that integrating all three loss functions leverages their strengths, resulting in a more robust model performance across all evaluation metrics.</p>
<p id="p-35">In conclusion, this paper introduces MUCM-Net, an innovative and efficient solution that integrates CNN, MLP, and Mamba to offer robust feature learning while keeping parameter counts low and computational demands minimal. Applied to the challenging task of skin lesion segmentation, MUCM-Net has been rigorously tested across various evaluation metrics, demonstrating superior performance compared to other recent lightweight or Mamba-based models.</p>
<p id="p-36">Looking ahead, we plan to extend the application of MUCM-Net to other critical medical imaging tasks, aiming to advance the field and explore its potential across a broader range of healthcare applications. Additionally, we plan to explore how MUCM-Net can be effectively integrated with established hand-crafted segmentation methods (e.g., from [<xref ref-type="bibr" rid="B45">45</xref>, <xref ref-type="bibr" rid="B46">46</xref>]) to leverage their complementary strengths and potentially achieve even higher segmentation accuracy. We will also investigate methods to address adversarial noise attacks on skin cancer segmentation models [<xref ref-type="bibr" rid="B47">47</xref>, <xref ref-type="bibr" rid="B48">48</xref>], enhancing MUCM-Net’s robustness against potential manipulations that could compromise its performance. Our goal is to push the boundaries of deep learning in healthcare applications, making significant contributions to medical imaging as well as other areas of healthcare.</p>
</sec>
</sec>
</body>
<back>
<glossary>
<title>Abbreviations</title>
<def-list>
<def-item>
<term>ACC</term>
<def>
<p>accuracy</p>
</def>
</def-item>
<def-item>
<term>AI</term>
<def>
<p>artificial intelligence</p>
</def>
</def-item>
<def-item>
<term>BCE</term>
<def>
<p>Binary Cross-Entropy</p>
</def>
</def-item>
<def-item>
<term>CNNs</term>
<def>
<p>Convolutional Neural Networks</p>
</def>
</def-item>
<def-item>
<term>DSC</term>
<def>
<p>Dice Similarity Coefficient</p>
</def>
</def-item>
<def-item>
<term>GFLOPS</term>
<def>
<p>Giga Floating-point Operations Per Second</p>
</def>
</def-item>
<def-item>
<term>ISIC</term>
<def>
<p>International Skin Imaging Collaboration</p>
</def>
</def-item>
<def-item>
<term>MLPs</term>
<def>
<p>multi-layer perceptions</p>
</def>
</def-item>
<def-item>
<term>SE</term>
<def>
<p>sensitivity</p>
</def>
</def-item>
<def-item>
<term>SP</term>
<def>
<p>specificity</p>
</def>
</def-item>
<def-item>
<term>SSMs</term>
<def>
<p>state-space models</p>
</def>
</def-item>
<def-item>
<term>TinyML</term>
<def>
<p>tiny machine learning</p>
</def>
</def-item>
</def-list>
</glossary>
<sec id="s-suppl" sec-type="supplementary-material">
<title>Supplementary materials</title>
<p>The supplementary figures for this article are available at: <uri xlink:href="https://www.explorationpub.com/uploads/Article/file/1001250_sup_1.pdf">https://www.explorationpub.com/uploads/Article/file/1001250_sup_1.pdf</uri>.</p>
<supplementary-material id="SD1" content-type="local-data">
<media xlink:href="1001250_sup_1.pdf" mimetype="application" mime-subtype="pdf"></media>
</supplementary-material>
</sec>
<sec id="s6">
<title>Declarations</title>
<sec id="t-6-1">
<title>Author contributions</title>
<p>CY: Conceptualization, Investigation, Writing—original draft, Writing—review &amp; editing. DZ: Validation, Writing—review &amp; editing. SSA: Validation, Writing—review &amp; editing, Supervision. All authors read and approved the submitted version.</p>
</sec>
<sec id="t-6-2" sec-type="COI-statement">
<title>Conflicts of interest</title>
<p>The authors declare that they have no conflicts of interest.</p>
</sec>
<sec id="t-6-3">
<title>Ethical approval</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-4">
<title>Consent to participate</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-5">
<title>Consent to publication</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-6" sec-type="data-availability">
<title>Availability of data and materials</title>
<p>The datasets analyzed for this study can be found in ISIC17 Dataset: <uri xlink:href="https://challenge.isic-archive.com/data/#2017">https://challenge.isic-archive.com/data/#2017</uri>; ISIC18 Dataset: <uri xlink:href="https://challenge.isic-archive.com/data/#2018">https://challenge.isic-archive.com/data/#2018</uri>; Code Repo: <uri xlink:href="https://github.com/chunyuyuan/MUCM-Net">https://github.com/chunyuyuan/MUCM-Net</uri>.</p>
</sec>
<sec id="t-6-7">
<title>Funding</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-8">
<title>Copyright</title>
<p>© The Author(s) 2024.</p>
</sec>
</sec>
<ref-list>
<ref id="B1">
<label>1</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname>
<given-names>SL</given-names>
</name>
<name>
<surname>Fisher</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Hope-Stone</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Damato</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Heimann</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Hussain</surname>
<given-names>R</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Fear of cancer recurrence and adverse cancer treatment outcomes: predicting 2- to 5-year fear of recurrence from post-treatment symptoms and functional problems in uveal melanoma survivors</article-title>
<source>J Cancer Surviv</source>
<year iso-8601-date="2023">2023</year>
<volume>17</volume>
<fpage>187</fpage>
<lpage>96</lpage>
<pub-id pub-id-type="doi">10.1007/s11764-021-01129-0</pub-id>
<pub-id pub-id-type="pmid">34850324</pub-id>
</element-citation>
</ref>
<ref id="B2">
<label>2</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siegel</surname>
<given-names>RL</given-names>
</name>
<name>
<surname>Miller</surname>
<given-names>KD</given-names>
</name>
<name>
<surname>Wagle</surname>
<given-names>NS</given-names>
</name>
<name>
<surname>Jemal</surname>
<given-names>A</given-names>
</name>
</person-group>
<article-title>Cancer statistics, 2023</article-title>
<source>CA Cancer J Clin</source>
<year iso-8601-date="2023">2023</year>
<volume>73</volume>
<fpage>17</fpage>
<lpage>48</lpage>
<pub-id pub-id-type="doi">10.3322/caac.21763</pub-id>
<pub-id pub-id-type="pmid">36633525</pub-id>
</element-citation>
</ref>
<ref id="B3">
<label>3</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marks</surname>
<given-names>R</given-names>
</name>
</person-group>
<article-title>An overview of skin cancers</article-title>
<source>Cancer</source>
<year iso-8601-date="1995">1995</year>
<volume>75</volume>
<fpage>607</fpage>
<lpage>12</lpage>
<pub-id pub-id-type="doi">10.1002/1097-0142(19950115)75:2+&lt;607::aid-cncr2820751402&gt;3.0.co;2-8</pub-id>
<pub-id pub-id-type="pmid">7804986</pub-id>
</element-citation>
</ref>
<ref id="B4">
<label>4</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lehmann</surname>
<given-names>TM</given-names>
</name>
<name>
<surname>Gönner</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Spitzer</surname>
<given-names>K</given-names>
</name>
</person-group>
<article-title>Survey: interpolation methods in medical image processing</article-title>
<source>IEEE Trans Med Imaging</source>
<year iso-8601-date="1999">1999</year>
<volume>18</volume>
<fpage>1049</fpage>
<lpage>75</lpage>
<pub-id pub-id-type="doi">10.1109/42.816070</pub-id>
<pub-id pub-id-type="pmid">10661324</pub-id>
</element-citation>
</ref>
<ref id="B5">
<label>5</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goyal</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Husain</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Wilson</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Chopra</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Pahwa</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Loganathan</surname>
<given-names>M</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Recent advancements in skin cancer treatment: a critical review</article-title>
<source>Explor Med</source>
<year iso-8601-date="2023">2023</year>
<volume>4</volume>
<fpage>782</fpage>
<lpage>812</lpage>
<pub-id pub-id-type="doi">10.37349/emed.2023.00178</pub-id>
</element-citation>
</ref>
<ref id="B6">
<label>6</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nasir</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Attique</surname>
<given-names>Khan M</given-names>
</name>
<name>
<surname>Sharif</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Lali</surname>
<given-names>IU</given-names>
</name>
<name>
<surname>Saba</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Iqbal</surname>
<given-names>T</given-names>
</name>
</person-group>
<article-title>An improved strategy for skin lesion detection and classification using uniform segmentation and feature selection based approach</article-title>
<source>Microsc Res Tech</source>
<year iso-8601-date="2018">2018</year>
<volume>81</volume>
<fpage>528</fpage>
<lpage>43</lpage>
<pub-id pub-id-type="doi">10.1002/jemt.23009</pub-id>
<pub-id pub-id-type="pmid">29464868</pub-id>
</element-citation>
</ref>
<ref id="B7">
<label>7</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barata</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Celebi</surname>
<given-names>ME</given-names>
</name>
<name>
<surname>Marques</surname>
<given-names>JS</given-names>
</name>
</person-group>
<article-title>Explainable skin lesion diagnosis using taxonomies</article-title>
<source>Pattern Recognit</source>
<year iso-8601-date="2021">2021</year>
<volume>110</volume>
<elocation-id>107413</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.patcog.2020.107413</pub-id>
</element-citation>
</ref>
<ref id="B8">
<label>8</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hosny</surname>
<given-names>KM</given-names>
</name>
<name>
<surname>Elshoura</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Mohamed</surname>
<given-names>ER</given-names>
</name>
<name>
<surname>Vrochidou</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Papakostas</surname>
<given-names>GA</given-names>
</name>
</person-group>
<article-title>Deep Learning and Optimization-Based Methods for Skin Lesions Segmentation: A Review</article-title>
<source>IEEE Access</source>
<year iso-8601-date="2023">2023</year>
<volume>11</volume>
<fpage>85467</fpage>
<lpage>88</lpage>
<pub-id pub-id-type="doi">10.1109/ACCESS.2023.3303961</pub-id>
</element-citation>
</ref>
<ref id="B9">
<label>9</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>HY</given-names>
</name>
<name>
<surname>Hsiao</surname>
<given-names>YP</given-names>
</name>
<name>
<surname>Karmakar</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Mukundan</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Chaudhary</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Hsieh</surname>
<given-names>SC</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>A Review of Recent Advances in Computer-Aided Detection Methods Using Hyperspectral Imaging Engineering to Detect Skin Cancer</article-title>
<source>Cancers (Basel)</source>
<year iso-8601-date="2023">2023</year>
<volume>15</volume>
<elocation-id>5634</elocation-id>
<pub-id pub-id-type="doi">10.3390/cancers15235634</pub-id>
<pub-id pub-id-type="pmid">38067338</pub-id>
<pub-id pub-id-type="pmcid">PMC10705122</pub-id>
</element-citation>
</ref>
<ref id="B10">
<label>10</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Sanchez</surname>
<given-names>I</given-names>
</name>
<name>
<surname>Agaian</surname>
<given-names>S</given-names>
</name>
</person-group>
<comment>A new system of computer-aided diagnosis of skin lesions. In: Egiazarian KO, Agaian SS, Gotchev AP, Recker J, Wang G, editors. Image Processing: Algorithms and Systems X; and Parallel Processing for Imaging Applications II. IS&amp;T/SPIE Electronic Imaging; 2012 Jan 22-26; Burlingame, United States. 2012.</comment>
<pub-id pub-id-type="doi">10.1117/12.906796</pub-id>
</element-citation>
</ref>
<ref id="B11">
<label>11</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Carvalho</surname>
<given-names>TM</given-names>
</name>
<name>
<surname>Noels</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Wakkee</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Udrea</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Nijsten</surname>
<given-names>T</given-names>
</name>
</person-group>
<article-title>Development of Smartphone Apps for Skin Cancer Risk Assessment: Progress and Promise</article-title>
<source>JMIR Dermatol</source>
<year iso-8601-date="2019">2019</year>
<volume>2</volume>
<elocation-id>e13376</elocation-id>
<pub-id pub-id-type="doi">10.2196/13376</pub-id>
</element-citation>
</ref>
<ref id="B12">
<label>12</label>
<element-citation publication-type="web">
<article-title>Butterfly iQ+<sup>TM</sup> [Internet]</article-title>
<comment>Butterfly Network, inc; c2024 [cited 2024 Jul 30]. Available from: <uri xlink:href="https://www.butterflynetwork.com/iq-plus">https://www.butterflynetwork.com/iq-plus</uri></comment>
</element-citation>
</ref>
<ref id="B13">
<label>13</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Bui</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y</given-names>
</name>
</person-group>
<article-title>Using AI to help find answers to common skin conditions [Internet]</article-title>
<comment>[cited 2024 Jul 30]. Available from: <uri xlink:href="https://blog.google/technology/health/ai-dermatology-preview-io-2021/">https://blog.google/technology/health/ai-dermatology-preview-io-2021/</uri></comment>
</element-citation>
</ref>
<ref id="B14">
<label>14</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Esteva</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Robicquet</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Ramsundar</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Kuleshov</surname>
<given-names>V</given-names>
</name>
<name>
<surname>DePristo</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Chou</surname>
<given-names>K</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>A guide to deep learning in healthcare</article-title>
<source>Nat Med</source>
<year iso-8601-date="2019">2019</year>
<volume>25</volume>
<fpage>24</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.1038/s41591-018-0316-z</pub-id>
<pub-id pub-id-type="pmid">30617335</pub-id>
</element-citation>
</ref>
<ref id="B15">
<label>15</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Deep Learning on Computational-Resource-Limited Platforms: A Survey</article-title>
<source>Mobile Inf Syst</source>
<year iso-8601-date="2020">2020</year>
<volume>2020</volume>
<elocation-id>8454327</elocation-id>
<pub-id pub-id-type="doi">10.1155/2020/8454327</pub-id>
</element-citation>
</ref>
<ref id="B16">
<label>16</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Thompson</surname>
<given-names>NC</given-names>
</name>
<name>
<surname>Greenewald</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Manso</surname>
<given-names>GF</given-names>
</name>
</person-group>
<article-title>The Computational Limits of Deep Learning</article-title>
<comment>arXiv:2007.05558v1 [Preprint]. 2020 [cited 2024 Jul 30]: [46 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2007.05558">https://doi.org/10.48550/arXiv.2007.05558</uri></comment>
</element-citation>
</ref>
<ref id="B17">
<label>17</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Agaian</surname>
<given-names>SS</given-names>
</name>
</person-group>
<article-title>UCM-Net: A lightweight and efficient solution for skin lesion segmentation using MLP and CNN</article-title>
<source>Biomed Signal Process Control</source>
<year iso-8601-date="2024">2024</year>
<volume>96</volume>
<elocation-id>106573</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.bspc.2024.106573</pub-id>
</element-citation>
</ref>
<ref id="B18">
<label>18</label>
<element-citation publication-type="web">
<article-title>ISIC Challenge [dataset]</article-title>
<comment>2017 [cited 2024 Jul 30]. Available from: <uri xlink:href="https://challenge.isic-archive.com/data/#2017">https://challenge.isic-archive.com/data/#2017</uri></comment>
</element-citation>
</ref>
<ref id="B19">
<label>19</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Berseth</surname>
<given-names>M</given-names>
</name>
</person-group>
<article-title>ISIC 2017 - Skin Lesion Analysis Towards Melanoma Detection</article-title>
<comment>arXiv:1703.00523 [Preprint]. 2017 [cited 2024 Jul 30]: [4 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.1703.00523">https://doi.org/10.48550/arXiv.1703.00523</uri></comment>
</element-citation>
</ref>
<ref id="B20">
<label>20</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tschandl</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Rosendahl</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Kittler</surname>
<given-names>H</given-names>
</name>
</person-group>
<article-title>The HAM10000 dataset, a large collection of multi-source dermatoscopic images of common pigmented skin lesions</article-title>
<source>Sci Data</source>
<year iso-8601-date="2018">2018</year>
<volume>5</volume>
<elocation-id>180161</elocation-id>
<pub-id pub-id-type="doi">10.1038/sdata.2018.161</pub-id>
<pub-id pub-id-type="pmid">30106392</pub-id>
<pub-id pub-id-type="pmcid">PMC6091241</pub-id>
</element-citation>
</ref>
<ref id="B21">
<label>21</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Codella</surname>
<given-names>N</given-names>
</name>
<name>
<surname>Rotemberg</surname>
<given-names>V</given-names>
</name>
<name>
<surname>Tschandl</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Celebi</surname>
<given-names>ME</given-names>
</name>
<name>
<surname>Dusza</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Gutman</surname>
<given-names>D</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Skin Lesion Analysis Toward Melanoma Detection 2018: A Challenge Hosted by the International Skin Imaging Collaboration (ISIC)</article-title>
<comment>arXiv:1902.03368 [Preprint]. 2019 [cited 2024 Jul 30]: [12 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.1902.03368">https://doi.org/10.48550/arXiv.1902.03368</uri></comment>
</element-citation>
</ref>
<ref id="B22">
<label>22</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>MUK</given-names>
</name>
<name>
<surname>Kyung</surname>
<given-names>CM</given-names>
</name>
</person-group>
<comment>Efficient Neural Network Compression. In: 2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). Conference on Computer Vision and Pattern Recognition (CVPR); 2019 Jun 15-20; Long Beach, USA. IEEE; 2019. pp. 12561–9.</comment>
<pub-id pub-id-type="doi">10.1109/CVPR.2019.01285</pub-id>
</element-citation>
</ref>
<ref id="B23">
<label>23</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Agaian</surname>
<given-names>SS</given-names>
</name>
</person-group>
<article-title>A comprehensive review of Binary Neural Network</article-title>
<source>Artif Intell Rev</source>
<year iso-8601-date="2023">2023</year>
<volume>56</volume>
<fpage>12949</fpage>
<lpage>3013</lpage>
<pub-id pub-id-type="doi">10.1007/s10462-023-10464-w</pub-id>
</element-citation>
</ref>
<ref id="B24">
<label>24</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Huangfu</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Ran</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Dynamic Corrected Split Federated Learning With Homomorphic Encryption for U-Shaped Medical Image Networks</article-title>
<source>IEEE J Biomed Health Inform</source>
<year iso-8601-date="2023">2023</year>
<volume>27</volume>
<fpage>5946</fpage>
<lpage>57</lpage>
<pub-id pub-id-type="doi">10.1109/JBHI.2023.3317632</pub-id>
<pub-id pub-id-type="pmid">37729562</pub-id>
</element-citation>
</ref>
<ref id="B25">
<label>25</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Oktay</surname>
<given-names>O</given-names>
</name>
<name>
<surname>Schlemper</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Folgoc</surname>
<given-names>LL</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Heinrich</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Misawa</surname>
<given-names>K</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Attention U-Net: Learning Where to Look for the Pancreas</article-title>
<comment>arXiv:1804.03999 [Preprint]. 2018 [cited 2024 Jul 30]: [10 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.1804.03999">https://doi.org/10.48550/arXiv.1804.03999</uri></comment>
</element-citation>
</ref>
<ref id="B26">
<label>26</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Adeli</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>TransUNet: Transformers Make Strong Encoders for Medical Image Segmentation</article-title>
<comment>arXiv:2102.04306 [Preprint]. 2021 [cited 2024 Jul 30]: [13 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2102.04306">https://doi.org/10.48550/arXiv.2102.04306</uri></comment>
</element-citation>
</ref>
<ref id="B27">
<label>27</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Q</given-names>
</name>
</person-group>
<comment>TransFuse: Fusing Transformers and CNNs for Medical Image Segmentation. In: de Bruijne M, Cattin PC, Cotin S, Padoy N, Speidel S, Zheng Y, et al., editors. Medical Image Computing and Computer Assisted Intervention – MICCAI 2021. International Conference on Medical Image Computing and Computer-Assisted Intervention; 2021 Sep 27-Oct 1; Strasbourg, France. Cham: Springer International Publishing; 2021. pp. 14–24.</comment>
<pub-id pub-id-type="doi">10.1007/978-3-030-87193-2_2</pub-id>
</element-citation>
</ref>
<ref id="B28">
<label>28</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Cao</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>Q</given-names>
</name>
<etal>et al.</etal>
</person-group>
<comment>Swin-Unet: Unet-Like Pure Transformer for Medical Image Segmentation. In: Karlinsky L, Michaeli T, Nishino K, editors. Computer Vision – ECCV 2022 Workshops. European Conference on Computer Vision; 2022 Oct 23-27; Tel Aviv, Israel. Cham: Springer Nature Switzerland; 2023. pp. 205–18.</comment>
<pub-id pub-id-type="doi">10.1007/978-3-031-25066-8_9</pub-id>
</element-citation>
</ref>
<ref id="B29">
<label>29</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>CY</given-names>
</name>
<name>
<surname>Feichtenhofer</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Darrell</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>S</given-names>
</name>
</person-group>
<comment>A ConvNet for the 2020s. In: 2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). Conference on Computer Vision and Pattern Recognition (CVPR); 2022 Jun 18-24; New Orleans, USA. IEEE; 2022. pp. 11966–76.</comment>
<pub-id pub-id-type="doi">10.1109/CVPR52688.2022.01167</pub-id>
</element-citation>
</ref>
<ref id="B30">
<label>30</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Valanarasu</surname>
<given-names>JMJ</given-names>
</name>
<name>
<surname>Patel</surname>
<given-names>VM</given-names>
</name>
</person-group>
<comment>UNeXt: MLP-Based Rapid Medical Image Segmentation Network. In: Wang L, Dou Q, Fletcher PT, Speidel S, Li S, editors. Medical Image Computing and Computer Assisted Intervention – MICCAI 2022. International Conference on Medical Image Computing and Computer-Assisted Intervention; 2022 Sep 18-22; Singapore, Singapore. Cham: Springer Nature Switzerland; 2022. pp. 23–33.</comment>
<pub-id pub-id-type="doi">10.1007/978-3-031-16443-9_3</pub-id>
</element-citation>
</ref>
<ref id="B31">
<label>31</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Ruan</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Xiang</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>Y</given-names>
</name>
</person-group>
<comment>MALUNet: A Multi-Attention and Light-weight UNet for Skin Lesion Segmentation. In: 2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM). IEEE International Conference on Bioinformatics and Biomedicine (BIBM); 2022 Dec 6-8; Las Vegas, USA. IEEE; 2022. pp. 1150–6.</comment>
<pub-id pub-id-type="doi">10.1109/BIBM55620.2022.9995040</pub-id>
</element-citation>
</ref>
<ref id="B32">
<label>32</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Ruan</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>Y</given-names>
</name>
</person-group>
<article-title>EGE-UNet: an Efficient Group Enhanced UNet for skin lesion segmentation</article-title>
<comment>arXiv:2307.08473 [Preprint]. 2023 [cited 2024 Jul 30]: [10 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2307.08473">https://doi.org/10.48550/arXiv.2307.08473</uri></comment>
</element-citation>
</ref>
<ref id="B33">
<label>33</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X</given-names>
</name>
</person-group>
<article-title>Vision Mamba: Efficient Visual Representation Learning with Bidirectional State Space Model</article-title>
<comment>arXiv:2401.09417 [Preprint]. 2024 [cited 2024 Jul 30]: [11 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2401.09417">https://doi.org/10.48550/arXiv.2401.09417</uri></comment>
</element-citation>
</ref>
<ref id="B34">
<label>34</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Ruan</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Xiang</surname>
<given-names>S</given-names>
</name>
</person-group>
<article-title>VM-UNet: Vision Mamba UNet for Medical Image Segmentation</article-title>
<comment>arXiv:2402.02491 [Preprint]. 2024 [cited 2024 Jul 30]: [12 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2402.02491">https://doi.org/10.48550/arXiv.2402.02491</uri></comment>
</element-citation>
</ref>
<ref id="B35">
<label>35</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Tao</surname>
<given-names>X</given-names>
</name>
</person-group>
<article-title>VM-UNET-V2 Rethinking Vision Mamba UNet for Medical Image Segmentation</article-title>
<comment>arXiv:2403.09157 [Preprint]. 2024 [cited 2024 Jul 30]: [12 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2403.09157">https://doi.org/10.48550/arXiv.2403.09157</uri></comment>
</element-citation>
</ref>
<ref id="B36">
<label>36</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Liao</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>L</given-names>
</name>
</person-group>
<article-title>LightM-UNet: Mamba Assists in Lightweight UNet for Medical Image Segmentation</article-title>
<comment>arXiv:2403.05246 [Preprint]. 2024 [cited 2024 Jul 30]: [10 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2403.05246">https://doi.org/10.48550/arXiv.2403.05246</uri></comment>
</element-citation>
</ref>
<ref id="B37">
<label>37</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>Q</given-names>
</name>
</person-group>
<article-title>UltraLight VM-UNet: Parallel Vision Mamba Significantly Reduces Parameters for Skin Lesion Segmentation</article-title>
<comment>arXiv:2403.20035 [Preprint]. 2024 [cited 2024 Jul 30]: [16 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2403.20035">https://doi.org/10.48550/arXiv.2403.20035</uri></comment>
</element-citation>
</ref>
<ref id="B38">
<label>38</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Rong</surname>
<given-names>Y</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>State Space Model for New-Generation Network Alternative to Transformers: A Survey</article-title>
<comment>arXiv:2404.09516 [Preprint]. 2024 [cited 2024 Jul 30]: [33 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2404.09516">https://doi.org/10.48550/arXiv.2404.09516</uri></comment>
</element-citation>
</ref>
<ref id="B39">
<label>39</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Gu</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Dao</surname>
<given-names>T</given-names>
</name>
</person-group>
<article-title>Mamba: Linear-Time Sequence Modeling with Selective State Spaces</article-title>
<comment>arXiv:2312.00752v1 [Preprint]. 2023 [cited 2024 Jul 30]: [37 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.2312.00752">https://doi.org/10.48550/arXiv.2312.00752</uri></comment>
</element-citation>
</ref>
<ref id="B40">
<label>40</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Paszke</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Gross</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Massa</surname>
<given-names>F</given-names>
</name>
<name>
<surname>Lerer</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Bradbury</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Chanan</surname>
<given-names>G</given-names>
</name>
<etal>et al.</etal>
</person-group>
<comment>PyTorch: An Imperative Style, High-Performance Deep Learning Library. In: Wallach H, Larochelle H, Beygelzimer A, d’Alché-Buc F, Fox E, Garnett R, editors. Advances in Neural Information Processing Systems. Curran Associates, Inc.; 2019.</comment>
</element-citation>
</ref>
<ref id="B41">
<label>41</label>
<element-citation publication-type="web">
<article-title>lambdalabs.com [Internet]</article-title>
<comment>c2024 [cited 2024 Aug 10]. Available from: <uri xlink:href="https://lambdalabs.com/">https://lambdalabs.com/</uri></comment>
</element-citation>
</ref>
<ref id="B42">
<label>42</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goceri</surname>
<given-names>E</given-names>
</name>
</person-group>
<article-title>Medical image data augmentation: techniques, comparisons and interpretations</article-title>
<source>Artif Intell Rev</source>
<year iso-8601-date="2023">2023</year>
<volume>56</volume>
<fpage>12561</fpage>
<lpage>605</lpage>
<pub-id pub-id-type="doi">10.1007/s10462-023-10453-z</pub-id>
<pub-id pub-id-type="pmid">37362888</pub-id>
<pub-id pub-id-type="pmcid">PMC10027281</pub-id>
</element-citation>
</ref>
<ref id="B43">
<label>43</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Loshchilov</surname>
<given-names>I</given-names>
</name>
<name>
<surname>Hutter</surname>
<given-names>F</given-names>
</name>
</person-group>
<article-title>Decoupled Weight Decay Regularization</article-title>
<comment>arXiv:1711.05101 [Preprint]. 2017 [cited 2024 Jul 30]: [19 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.1711.05101">https://doi.org/10.48550/arXiv.1711.05101</uri></comment>
</element-citation>
</ref>
<ref id="B44">
<label>44</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Loshchilov</surname>
<given-names>I</given-names>
</name>
<name>
<surname>Hutter</surname>
<given-names>F</given-names>
</name>
</person-group>
<article-title>SGDR: Stochastic Gradient Descent with Warm Restarts</article-title>
<comment>arXiv:1608.03983 [Preprint]. 2016 [cited 2024 Jul 30]: [16 p.]. Available from: <uri xlink:href="https://doi.org/10.48550/arXiv.1608.03983">https://doi.org/10.48550/arXiv.1608.03983</uri></comment>
</element-citation>
</ref>
<ref id="B45">
<label>45</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Sanchez</surname>
<given-names>I</given-names>
</name>
<name>
<surname>Agaian</surname>
<given-names>S</given-names>
</name>
</person-group>
<comment>Computer aided diagnosis of lesions extracted from large skin surfaces. In: 2012 IEEE International Conference on Systems, Man, and Cybernetics (SMC). IEEE International Conference on Systems, Man and Cybernetics; 2012 Oct 14-17; Seoul, Korea (South). IEEE; 2012. pp. 2879–84.</comment>
<pub-id pub-id-type="doi">10.1109/ICSMC.2012.6378186</pub-id>
</element-citation>
</ref>
<ref id="B46">
<label>46</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Frants</surname>
<given-names>V</given-names>
</name>
<name>
<surname>Agaian</surname>
<given-names>S</given-names>
</name>
</person-group>
<comment>Dermoscopic image segmentation based on modified GrabCut with octree color quantization. In: Agaian SS, Asari VK, DelMarco SP, Jassim SA, editors. Mobile Multimedia/Image Processing, Security, and Applications 2020. SPIE Defense + Commercial Sensing; 2020 Apr 27-May 9; California, United States. 2020.</comment>
<pub-id pub-id-type="doi">10.1117/12.2556699</pub-id>
</element-citation>
</ref>
<ref id="B47">
<label>47</label>
<element-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Liew</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Agaian</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>L</given-names>
</name>
</person-group>
<article-title>Mitigation of adversarial noise attacks on skin cancer detection via ordered statistics binary local features</article-title>
<person-group person-group-type="editor">
<name>
<surname>Agaian</surname>
<given-names>SS</given-names>
</name>
<name>
<surname>Asari</surname>
<given-names>VK</given-names>
</name>
<name>
<surname>DelMarco</surname>
<given-names>SP</given-names>
</name>
</person-group>
<source>Multimodal Image Exploitation and Learning 2023</source>
<comment>SPIE Defense + Commercial Sensing; 2023 Apr 30-May 5; Orlando, United States. 2023.</comment>
<pub-id pub-id-type="doi">10.1117/12.2664239</pub-id>
</element-citation>
</ref>
<ref id="B48">
<label>48</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goceri</surname>
<given-names>E</given-names>
</name>
</person-group>
<article-title>Evaluation of denoising techniques to remove speckle and Gaussian noise from dermoscopy images</article-title>
<source>Comput Biol Med</source>
<year iso-8601-date="2023">2023</year>
<volume>152</volume>
<elocation-id>106474</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.compbiomed.2022.106474</pub-id>
<pub-id pub-id-type="pmid">36563540</pub-id>
</element-citation>
</ref>
</ref-list>
</back>
</article>