﻿<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.0 20120330//EN" "http://jats.nlm.nih.gov/publishing/1.0/JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="nlm-ta">Intell. Robot.</journal-id>
      <journal-id journal-id-type="publisher-id">IR</journal-id>
      <journal-title-group>
        <journal-title>Intelligence &amp; Robotics</journal-title>
      </journal-title-group>
      <issn pub-type="epub">2770-3541</issn>
      <publisher>
        <publisher-name>OAE Publishing Inc.</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.20517/ir.2026.15</article-id>
	  <article-id pub-id-type="publisher-id">IR-2025-102101</article-id>
      <article-categories>
        <subj-group>
          <subject>Research Article</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Intelligent prediction of the remaining useful life of lithium-ion batteries based on a CGHF-MDH-Mamba model</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="yes">
          <name>
            <surname>Li</surname>
            <given-names>Yanhao</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1" />
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Zhou</surname>
            <given-names>Xin</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Zhong</surname>
            <given-names>Feng</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Han</surname>
            <given-names>Wei</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Zhang</surname>
            <given-names>Zichong</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Tong</surname>
            <given-names>Rui</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <name>
            <surname>Huang</surname>
            <given-names>Lyuwen</given-names>
          </name>
          <xref ref-type="aff" rid="I2">
            <sup>2</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1" />
        </contrib>
      </contrib-group>
      <aff id="I1">
        <sup>1</sup>Guangzhou Power Supply Bureau of Guangdong Power Grid Co., Ltd, Guangzhou 510623, Guangdong, China.</aff>
      <aff id="I2">
        <sup>2</sup>College of Information Engineering, Northwest A&amp;F University, Yangling 712100, Shaanxi, China.</aff>
      <author-notes>
        <corresp id="cor1">Correspondence to: Yanhao Li, Guangzhou Power Supply Bureau of Guangdong Power Grid Co., Ltd, Guangzhou 510623, Guangdong, China. E-mail: <email>liyanhao@gzps.corp.csg</email>; Dr. Lyuwen Huang, College of Information Engineering, Northwest A&amp;F University, Yangling 712100, Shaanxi, China. E-mail: <email>huanglvwen@nwsuaf.edu.cn</email></corresp>
        <fn fn-type="other">
          <p>
            <bold>Received:</bold> 21 Oct 2025 |  <bold>First Decision:</bold> 31 Dec 2025 | <bold>Revised:</bold> 20 Mar 2026 | <bold>Accepted:</bold> 22 May 2026 |  <bold>Published:</bold> 18 Jun 2026</p>
        </fn>
        <fn fn-type="other">
          <p>
            <bold>Academic Editor:</bold> Simon Yang | <bold>Copy Editor:</bold> Pei-Yun Wang |  <bold>Production Editor:</bold> Pei-Yun Wang</p>
        </fn>
      </author-notes>
      <pub-date pub-type="ppub">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>18</day>
        <month>6</month>
        <year>2026</year>
      </pub-date>
      <volume>6</volume>
	  <issue>2</issue>
      <fpage>291</fpage>
	  <lpage>310</lpage>
      <permissions>
        <copyright-statement>© The Author(s) 2026.</copyright-statement>
        <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>© The Author(s) 2026. <bold>Open Access</bold> This article is licensed under a Creative Commons Attribution 4.0 International License (<uri xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</uri>), which permits unrestricted use, sharing, adaptation, distribution and reproduction in any medium or format, for any purpose, even commercially, as long as you give appropriate credit to the original author(s) and the source, provide a link to the Creative Commons license, and indicate if changes were made.</license-p>
        </license>
      </permissions>
      <abstract>
        <p>Lithium-ion batteries are core components of renewable generation and energy-storage systems and are widely deployed in PV/wind grid scheduling and e-mobility. Accurate remaining useful life (RUL) prediction is essential for operational stability and cost control. This paper proposes a battery life prediction approach that integrates channel-grouping half-convolution (CGHF) and a monotonic decreasing head (MDH) within a Mamba-based sequence modeling framework. CGHF reduces computational redundancy while strengthening multi-scale temporal representations; the selective state-space module of Mamba efficiently captures long-range dependencies; MDH imposes an explicit “non-increasing capacity” constraint at the decoder to enhance robustness and interpretability. Experiments on the National Aeronautics and Space Administration (NASA) Randomized Battery Usage Dataset and the Tongji University (TJU) Commercial Lithium-Ion Battery Cycling Dataset demonstrate superior RUL accuracy, achieving minimum capacity-prediction mean absolute errors (MAEs) of 0.0081 and 0.0009 Ah, respectively, outperforming strong baselines under the same settings. The method improves accuracy while maintaining fast inference, suggesting potential applicability to online health monitoring and maintenance planning, subject to further validation under more diverse operating conditions.</p>
      </abstract>
      <kwd-group>
        <kwd>Lithium-ion batteries</kwd>
        <kwd>remaining useful life</kwd>
        <kwd>Mamba</kwd>
        <kwd>channel-grouping half-convolution</kwd>
        <kwd>deep learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec id="sec1">
      <title>1. INTRODUCTION</title>
      <p>Lithium-ion batteries offer high energy density, long cycle stability, and low self-discharge<sup>[<xref ref-type="bibr" rid="B1">1</xref>]</sup>, making them the preferred power source for grid-scale energy storage and electric vehicles<sup>[<xref ref-type="bibr" rid="B2">2</xref>]</sup>. Their operational reliability directly affects the safety and economic performance of downstream systems. Artificial intelligence and digital twin technologies have been increasingly applied in intelligent battery management systems to enhance remaining useful life (RUL) prediction and lifecycle optimization<sup>[<xref ref-type="bibr" rid="B3">3</xref>]</sup>. However, during long-term charge-discharge cycles, degradation is driven by coupled multiphysics effects such as electrode structure deterioration and electrolyte decomposition. This process is highly nonlinear and time-dependent. The characteristic information is often hidden in the spatiotemporal evolution of multi-source monitoring data such as voltage, current, and temperature, which makes direct identification and modeling difficult<sup>[<xref ref-type="bibr" rid="B4">4</xref>]</sup>. At the same time, the prediction of RUL<sup>[<xref ref-type="bibr" rid="B5">5</xref>]</sup> still faces both theoretical and technical challenges. Capacity recovery, nonlinear degradation, and strong individual variation make mechanism-based modeling difficult. Data-driven approaches, although flexible, often suffer from weak spatiotemporal coupling, high noise sensitivity, and lack of physical constraints, which limits their generalization and reliability in practical applications<sup>[<xref ref-type="bibr" rid="B6">6</xref>]</sup>. Smart evolving fuzzy predictors optimized by firefly algorithms have been proposed to improve adaptability and robustness under noisy degradation conditions<sup>[<xref ref-type="bibr" rid="B7">7</xref>]</sup>. 
Therefore, achieving accurate, efficient, and physically consistent RUL prediction has become a key scientific challenge in the health management of modern energy storage systems.</p>
      <p>Current methods for lithium-ion battery RUL prediction can be divided into two main categories: model-based and data-driven<sup>[<xref ref-type="bibr" rid="B8">8</xref>,<xref ref-type="bibr" rid="B9">9</xref>]</sup>. Model-based methods describe degradation through electrochemical mechanisms or equivalent circuit models. For instance, the interactive multiple model particle flow filter (IMM-PFF) multi-model fusion method adapts to multi-stage degradation<sup>[<xref ref-type="bibr" rid="B2">2</xref>]</sup>, and Gaussian mixture resampling improves particle filtering to reduce uncertainty<sup>[<xref ref-type="bibr" rid="B10">10</xref>]</sup>. However, these methods rely heavily on prior physical assumptions and show weak generalization under complex or unseen conditions such as those in photovoltaic or wind power systems, making them unsuitable for dynamic storage environments<sup>[<xref ref-type="bibr" rid="B11">11</xref>]</sup>. Data-driven methods have progressively improved in feature fitting. GRU-based frameworks combined with feature selection and clustering have further improved SOH and RUL prediction performance<sup>[<xref ref-type="bibr" rid="B12">12</xref>]</sup>. Hybrid ensemble learning frameworks have also been proposed to enhance the stability and accuracy of RUL prediction<sup>[<xref ref-type="bibr" rid="B13">13</xref>]</sup>. Recent studies have shown that extracting health indicators from partial charging curves can effectively improve the accuracy and practicality of data-driven SOH and RUL estimation methods<sup>[<xref ref-type="bibr" rid="B14">14</xref>]</sup>. 
The discrete wavelet decomposition and support vector regression model (DWD-SVR)<sup>[<xref ref-type="bibr" rid="B15">15</xref>]</sup> and the general regression neural network optimized by gravity search algorithm and enhanced with extreme learning machine (GRNN-GSA-ELM)<sup>[<xref ref-type="bibr" rid="B16">16</xref>]</sup> have achieved progress in multi-scale fitting and small-sample robustness, while K-means clustering-random forest and particle swarm optimization-elastic net models optimize individual adaptability and feature selection<sup>[<xref ref-type="bibr" rid="B15">15</xref>]</sup>. Nevertheless, the nonlinear representation of multi-dimensional time series remains limited under traditional machine-learning frameworks. Improved Dempster-Shafer evidence theory has been applied to enhance multi-source information fusion in RUL prediction<sup>[<xref ref-type="bibr" rid="B17">17</xref>]</sup>. Deep learning techniques have substantially improved lithium-ion battery RUL prediction in recent years. Recurrent and hybrid architectures, including OOA-BiGRU<sup>[<xref ref-type="bibr" rid="B18">18</xref>]</sup>, CEEMDAN-CNN-BiGRU<sup>[<xref ref-type="bibr" rid="B19">19</xref>]</sup>, attention-based BiLSTM models<sup>[<xref ref-type="bibr" rid="B20">20</xref>]</sup>, CEEMDAN-BiLSTM-Transformer<sup>[<xref ref-type="bibr" rid="B21">21</xref>]</sup>, and 1D CNN-BLSTM frameworks<sup>[<xref ref-type="bibr" rid="B22">22</xref>]</sup>, have demonstrated enhanced temporal feature extraction capability. 
Transformer-based and multi-scale architectures, such as dynamic convolution transformers<sup>[<xref ref-type="bibr" rid="B23">23</xref>]</sup>, temporal convolution networks (TCN)<sup>[<xref ref-type="bibr" rid="B24">24</xref>]</sup>, transfer-learning AE-LSTM<sup>[<xref ref-type="bibr" rid="B25">25</xref>]</sup>, TransRUL<sup>[<xref ref-type="bibr" rid="B26">26</xref>]</sup>, comparative Transformer frameworks<sup>[<xref ref-type="bibr" rid="B27">27</xref>]</sup>, and hybrid Informer-LSTM models<sup>[<xref ref-type="bibr" rid="B28">28</xref>]</sup>, further improve long-sequence representation and degradation-stage awareness. However, major drawbacks remain. Most models extract temporal and spatial features separately, failing to capture the coupling among voltage, current, and temperature. The absence of physical constraints may lead to prediction trajectories that violate the capacity degradation mechanism. In addition, large parameter counts result in high inference costs<sup>[<xref ref-type="bibr" rid="B29">29</xref>]</sup>.</p>
      <p>Despite substantial progress, three key challenges remain in lithium-ion battery RUL prediction. First, spatiotemporal coupling of multi-dimensional features is insufficient. Most models handle voltage, current, and temperature independently in the temporal dimension and merge them by simple concatenation<sup>[<xref ref-type="bibr" rid="B30">30</xref>]</sup>, which fails to capture their dynamic relationships during degradation and leads to incomplete feature representations. Additionally, the prediction process lacks physical constraints. Many models rely purely on data fitting without embedding the fundamental physical law of irreversible capacity decay, resulting in unrealistic oscillations or increases in the predicted trajectories that contradict actual degradation behavior<sup>[<xref ref-type="bibr" rid="B31">31</xref>]</sup>. Finally, model efficiency and architecture innovation lag behind. Current deep-learning models are typically large and slow during inference, which restricts their use in real-time monitoring or edge deployment. Efficient architectures such as Mamba<sup>[<xref ref-type="bibr" rid="B32">32</xref>]</sup> and channel-grouped half convolution<sup>[<xref ref-type="bibr" rid="B33">33</xref>]</sup> have not yet been systematically applied to RUL prediction. Recent work has demonstrated that state space models (SSM) can effectively capture long-term degradation dependencies in early RUL prediction tasks<sup>[<xref ref-type="bibr" rid="B34">34</xref>]</sup>. Their potential advantages in long-sequence dependency modeling and computational efficiency have not been fully realized<sup>[<xref ref-type="bibr" rid="B35">35</xref>]</sup>.</p>
      <p>Overall, this study aims to improve the accuracy, efficiency, and physical consistency of lithium-ion battery RUL prediction. Unlike existing approaches that introduce isolated improvements, this work focuses on a task-oriented integration of multi-level feature modeling and physics-informed constraints. The main contributions are as follows.</p>
      <p>• A unified CGHF-VSN-Mamba framework is proposed to jointly model channel-level, variable-level, and temporal dependencies, enabling effective spatiotemporal coupling of battery degradation signals.</p>
      <p>• A channel-grouped half convolution combined with attention is designed to reduce redundancy while preserving informative features, forming a lightweight yet expressive representation mechanism.</p>
      <p>• A monotonic decreasing head (MDH) with adaptive gating is introduced to embed physical degradation constraints directly into the prediction process, improving both reliability and interpretability.</p>
      <p>These components are not simply combined, but structurally coordinated to address three core challenges simultaneously: feature redundancy, long-sequence modeling, and lack of physical consistency.</p>
    </sec>
    <sec id="sec2">
      <title>2. METHODS</title>
      <sec id="sec2-1">
        <title>2.1. Channel-grouping half-convolution</title>
        <p>In lithium-ion battery operation data, different variables and channel dimensions contain multi-scale degradation patterns. To capture local temporal dynamics while maintaining computational efficiency, a channel-grouping half-convolution (CGHF) module is introduced, as illustrated in <xref ref-type="fig" rid="fig1">Figure 1</xref>.</p>
        <fig id="fig1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Structure of the CGHF module. CGHF: Channel-grouping half-convolution; SE: Squeeze-and-Excitation.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6015.fig.1.jpg" />
        </fig>
        <p>The key idea is to divide the input feature channels into several independent groups and use a “half-convolution plus half-bypass” structure within each group to achieve efficient modeling. Specifically, in each subgroup, half of the channels are processed by depth-wise separable convolution to extract local temporal features, while the remaining half are passed directly to preserve raw information. The two parts are then concatenated within the group and added to the input residual, balancing feature transformation and information fidelity.</p>
        <p>Meanwhile, the CGHF module incorporates a Squeeze-and-Excitation (SE) attention mechanism<sup>[<xref ref-type="bibr" rid="B36">36</xref>]</sup>. This mechanism first performs global average pooling on each channel, then applies two fully connected layers with dimensionality reduction, expansion, and nonlinear activation to generate channel-wise weights. Finally, channel-wise reweighting is applied to the concatenated features, allowing the model to adaptively highlight channels more sensitive to capacity degradation while suppressing redundant or noisy information.</p>
        <p>To balance local dynamic sensitivity and information fidelity, the input <italic>X</italic> ∈ ℝ<italic><sup>B</sup></italic><sup>×</sup><italic><sup>L</sup></italic><sup>×</sup><italic><sup>D</sup></italic> is evenly divided into <italic>G</italic> groups. For the <italic>i</italic>-th group, the channels are halved: one path passes through convolution, while the other bypasses to retain the original data. The two paths are concatenated within each group, groups operate in parallel, and SE attention performs the final channel recalibration.</p>
        <p>The grouping and halving process is defined in Equation (1).</p>
		<p><disp-formula> <label>(1)</label> <tex-math id="E1"> $$  X^{(i)}=
\left[
X_{conv}^{(i)},
X_{keep}^{(i)}
\right] $$ </tex-math></disp-formula></p>
        <p>Here, <italic>X</italic><sup>(</sup><italic><sup>i</sup></italic><sup>)</sup> denotes the output feature of the <italic>i</italic>-th group. <italic>X</italic><sup>(</sup><italic><sup>i</sup></italic><sup>)</sup><italic><sub>conv</sub></italic> represents the half-channel feature processed by the depthwise convolution branch, while <italic>X</italic><sup>(</sup><italic><sup>i</sup></italic><sup>)</sup><italic><sub>keep</sub></italic> denotes the bypassed half-channel feature that preserves the original information. The in-group convolution extraction is defined in Equation (2).</p>
		<p><disp-formula> <label>(2)</label> <tex-math id="E2"> $$  \tilde{Y}^{(i)}
=
\phi\!\left(
\mathrm{BN}_{i}
\!\left(
\mathrm{Conv1d}_{i}
\!\left(
X_{conv}^{(i)}
\right)
\right)
\right) $$ </tex-math></disp-formula></p>
        <p>In Equation (2), <inline-formula><tex-math id="M1">$$ \tilde{Y}^{(i)}  $$</tex-math></inline-formula> denotes the intermediate feature extracted by the convolutional branch within the <italic>i</italic>-th group. The term <italic>X</italic><sup>(</sup><italic><sup>i</sup></italic><sup>)</sup><italic><sub>conv</sub></italic> corresponds to the convolutional half-channel feature defined in Equation (1). The bypass and concatenation are expressed in Equation (3).</p>
		<p><disp-formula> <label>(3)</label> <tex-math id="E3"> $$  Y^{(i)}
=
\left[
\tilde{Y}^{(i)},
X_{keep}^{(i)}
\right] $$ </tex-math></disp-formula></p>
        <p>The SE recalibration is defined in Equation (4).</p>
		<p><disp-formula> <label>(4)</label> <tex-math id="E4"> $$  Y=
\left(
Cat_{i}\,Y^{(i)}
\right)
\odot
\sigma
\!\left(
W_{2}\,
\phi
\!\left(
W_{1}\,
GAP
\!\left(
Cat_{i}\,Y^{(i)}
\right)
\right)
\right) $$ </tex-math></disp-formula></p>
        <p>In Equation (4), <italic>Y</italic> denotes the final output of the CGHF module after channel-wise recalibration. <italic>Cat<sub>i</sub>Y</italic><sup>(</sup><italic><sup>i</sup></italic><sup>)</sup> represents the concatenated features from all groups. <italic>W</italic><sub>1</sub> and <italic>W</italic><sub>2</sub> are the learnable weight matrices of the two fully connected layers in the SE attention, responsible for channel-wise dimensionality reduction and expansion. The resulting sigmoid activation generates channel weights that re-scale the concatenated features through Hadamard multiplication. Here, <italic>ϕ</italic> denotes GELU, BN denotes batch normalization, Conv1d denotes one-dimensional convolution, GAP denotes global average pooling, σ denotes the sigmoid function, <inline-formula><tex-math id="M2">$$ \odot  $$</tex-math></inline-formula> represents Hadamard channel-wise multiplication, and Cat indicates channel-wise concatenation.</p>
        <p>Compared with conventional convolutional structures, CGHF reduces redundancy through two mechanisms. First, the half-bypass design preserves raw features, avoiding excessive transformation that may amplify noise. Second, the SE attention dynamically suppresses channels with low contribution, ensuring that redundant information is not propagated to subsequent modules. This design is further complemented by the variable selection network (VSN) module at the variable level, forming a hierarchical redundancy reduction strategy.</p>
      </sec>
      <sec id="sec2-2">
        <title>2.2. VSN</title>
        <p>In multivariate operation data, different features affect battery life to varying degrees. Treating all variables equally during prediction introduces feature redundancy and weakens the contribution of degradation-sensitive variables, thereby reducing both prediction accuracy and interpretability. To address this issue, the model incorporates a VSN that performs adaptive weighting and selection of input variables, as shown in <xref ref-type="fig" rid="fig2">Figure 2</xref>.</p>
        <fig id="fig2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Structure of the VSN module. VSN: Variable selection network; GRN: gated residual network.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6015.fig.2.jpg" />
        </fig>
        <p>Specifically, the VSN constructs an independent gated residual subnetwork for each input variable to generate its candidate representation. This process ensures that every variable undergoes an independent nonlinear transformation before weighting, allowing the network to capture its latent temporal characteristics. Then, all candidate representations are concatenated and passed into a weight generation network, which applies a sparsified softmax distribution to assign variable weights. This sparsity mechanism suppresses the influence of secondary variables and highlights the most important ones during aggregation.</p>
        <p>Finally, the VSN fuses the weighted variable representations into a unified temporal feature representation. This module reduces redundancy in the input feature space and enhances interpretability by explicitly indicating which operational variables play a dominant role in the prediction of battery life. The sparsified softmax weighting enables the model to focus on a subset of dominant variables while suppressing less informative ones. Although explicit visualization such as heatmaps is not included in this study, the effectiveness of this mechanism is indirectly validated through ablation experiments, where the inclusion of VSN yields good robustness and prediction accuracy. Future work will incorporate visualization techniques to further enhance interpretability.</p>
      </sec>
      <sec id="sec2-3">
        <title>2.3. Mamba encoder and selective scanning</title>
        <p>Currently, deep learning research on sequence modeling mainly focuses on recurrent neural networks (RNNs) and Transformer architectures. The former often suffers from gradient vanishing when modeling long-term dependencies, while the latter can capture global relationships but has a quadratic computational complexity O(<italic>L</italic><sup>2</sup>) in its self-attention mechanism, leading to high computation and memory costs in long-sequence tasks. To address this issue, the Mamba model has been proposed. Its core idea is to build upon SSM and the Selective Scan mechanism to capture long-range dependencies efficiently while maintaining linear time complexity O(<italic>L</italic>) as shown in <xref ref-type="fig" rid="fig3">Figure 3</xref>.</p>
        <fig id="fig3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Structure of the Mamba state-space modeling module. SSM: State space models.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6015.fig.3.jpg" />
        </fig>
        <p>In this study, Mamba is employed to efficiently model the full life-cycle capacity curve of lithium-ion batteries. The degradation process exhibits strong long-term dependencies, and relying solely on local statistical features fails to represent the overall degradation trend. The SSM mechanism in Mamba dynamically updates hidden states through parameterized transition matrices (<italic>A</italic>, <italic>B</italic>, <italic>C</italic>, Δ, <italic>D</italic>), capturing both short-term fluctuations and long-term decay patterns. This enables the model to generate stable feature representations for RUL prediction.</p>
        <p>The Mamba module consists of four components:</p>
        <p>Input projection (in_proj) - The input sequence is linearly mapped into two parts: a hidden-state representation and a residual signal. This prepares the data for state updates and subsequent feature fusion.</p>
        <p>Depthwise convolution (conv1d) - A one-dimensional depthwise convolution is applied along the sequence dimension to extract local neighborhood information and enhance temporal smoothness. This operation is implemented as grouped convolution in the MambaBlock.</p>
        <p>State-space recurrence (ssm) - The module performs the Selective Scan process using parameterized matrices A, B, C, D and a dynamic step size ∆ computed from the input, as expressed in Equation (5)<sup>[<xref ref-type="bibr" rid="B32">32</xref>]</sup>.</p>
		<p><disp-formula> <label>(5)</label> <tex-math id="E5"> $$  x_t
=
\Delta Ax_{t-1}
+
\Delta Bu_t,
\quad 
y_t
=
C x_t
+
D u_t $$ </tex-math></disp-formula></p>
        <p>In Equation (5), <italic>x<sub>t</sub></italic> denotes the hidden state of the state-space model at time step <italic>t</italic>, and <italic>x<sub>t</sub></italic><sub>-1</sub> is the previous hidden state. <italic>u<sub>t</sub></italic> represents the input signal derived from the projected feature sequence, while <italic>y<sub>t</sub></italic> denotes the output of the SSM at the current step. <italic>A</italic>, <italic>B</italic>, <italic>C</italic>, and <italic>D</italic> are learnable state transition, input mapping, output projection, and direct feed-through matrices, respectively, which jointly govern the evolution of the system dynamics. The term Δ acts as a data-dependent dynamic step size, modulating the discrete-time update and enabling the selective scan mechanism to adjust temporal scaling adaptively. Here, ∆ is constrained to be non-negative through the softplus function, ensuring reasonable time-step scaling. This mechanism is the key for Mamba to effectively capture long-range dependencies.</p>
        <p>Residual connection and output projection (out_proj) - The recursive output is combined with the residual signal and projected linearly back to the original dimension. This preserves information and enhances representational capacity.</p>
        <p>In the overall framework, the hidden-state sequence output by the Mamba module is used to generate contextual representations and is further combined with the trend-constrained module (MDH) to ensure physically consistent predictions.</p>
      </sec>
      <sec id="sec2-4">
        <title>2.4. MDH</title>
        <p>In lithium-ion battery lifetime prediction, battery capacity generally follows an overall decreasing trend as the cycle number increases. However, apparent local recovery may occur because of relaxation effects, temperature variations, or measurement noise. Purely data-driven deep learning models may violate this degradation characteristic and generate locally increasing predictions that lack physical plausibility and interpretability. To address this, an MDH is designed to impose a physical constraint on the predicted capacity at the output stage, as shown in <xref ref-type="fig" rid="fig4">Figure 4</xref>.</p>
        <fig id="fig4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Structure of the MDH module. MDH: Monotonic decreasing head.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6015.fig.4.jpg" />
        </fig>
        <p>To ensure non-increasing capacity, the MDH outputs a non-negative “decrement value” and constrains its relative magnitude. The result is then adaptively fused with the original regression head through a gating mechanism. The previous-step capacity <italic>y<sub>t</sub></italic>, local trend Δ<italic>h<sub>t</sub></italic> = <italic>h<sub>t</sub><sup>last</sup></italic> - <italic>h<sub>t</sub></italic><sub>-1</sub><italic><sup>last</sup></italic>, and contextual representation <italic>c<sub>t</sub></italic> are all integrated in this process.</p>
        <p>The trend-aware decrement is defined in Equation (6).</p>
		<p><disp-formula> <label>(6)</label> <tex-math id="E6"> $$  \Delta_t
=
\operatorname{softplus}
\!\left(
f_{\theta}
\!\left(
[c_t,\Delta h_t]
\right)
\right)
\ge 0 $$ </tex-math></disp-formula></p>
        <p>In Equation (6), <italic>c<sub>t</sub></italic> denotes the contextual hidden representation output by the sequence encoder at step <italic>t</italic>, while Δ<italic>h<sub>t</sub></italic> represents the local trend descriptor extracted from the recent degradation trajectory. The function <italic>f<sub>θ</sub></italic>(·) is a two-layer multilayer perceptron that maps the concatenated features into a latent decrement score, which is then transformed into a non-negative value through the softplus function. The upper bound of the relative decrement is defined in Equation (7).</p>
		<p><disp-formula> <label>(7)</label> <tex-math id="E7"> $$  \Delta_t
\leftarrow
\min
\left\{
\Delta_t,
\eta y_t
\right\},
\quad
0&lt; \eta &lt;1 $$ </tex-math></disp-formula></p>
        <p>This structure ensures that the predicted capacity strictly decreases across cycles. The monotonic branch is expressed in Equation (8).</p>
        <p><disp-formula> <label>(8)</label> <tex-math id="E8"> $$  y_{t+1}^{mono}
=
y_t-\Delta_t
\le y_t $$ </tex-math></disp-formula></p>
        <p>In Equation (8), <italic>y<sub>t</sub></italic><sub>+1</sub><italic><sup>mono</sup> </italic>denotes the monotonicity-enforced capacity prediction. The term <italic>y<sub>t</sub></italic> is the previous capacity. The fusion of the main and auxiliary prediction branches is defined in Equation (9).</p>
        <p><disp-formula> <label>(9)</label> <tex-math id="E9"> $$  \hat{y}_{t+1}^{raw}
=
\lambda
\hat{y}_{t+1}^{main}
+
(1-\lambda)
\hat{y}_{t+1}^{aux},
\quad
\lambda=0.65 $$ </tex-math></disp-formula></p>
        <p>In Equation (9), <inline-formula><tex-math id="M1">$$ \hat{y} $$</tex-math></inline-formula><italic><sub>t</sub></italic><sub>+1</sub><italic><sup>main</sup></italic> is the output of the original regression head, whereas <inline-formula><tex-math id="M1">$$ \hat{y} $$</tex-math></inline-formula><italic><sub>t</sub></italic><sub>+1</sub><italic><sup>aux</sup></italic> is the auxiliary prediction produced by the monotonic branch. Their weighted combination yields the intermediate prediction <inline-formula><tex-math id="M1">$$ \hat{y} $$</tex-math></inline-formula><italic><sub>t</sub></italic><sub>+1</sub><italic><sup>raw</sup></italic>. The coefficient <italic>λ</italic> balances the contribution of the two branches and is empirically set to 0.65 to retain flexibility while preserving physical plausibility. The violation-adaptive gating mechanism is described in Equation (10).</p>
        <p><disp-formula> <label>(10)</label> <tex-math id="E10"> $$ \begin{aligned}
\hat{y}_{t+1}
&amp;=
g_t
y_{t+1}^{mono}
+
(1-g_t)
\hat{y}_{t+1}^{raw}\\
g_t
&amp;=
\operatorname{clip}
\!\left(
\sigma
\!\left(
W_g c_t
\right)
+
\beta
\Bigl[
\hat{y}_{t+1}^{raw}
&gt;
y_t
\Bigr],
\,0,\,1
\right)
\end{aligned} $$ </tex-math></disp-formula></p>
        <p>In Equation (10), <italic>g<sub>t</sub></italic> is a gating coefficient that adaptively increases when a physical violation occurs, directing the prediction toward the monotonic branch. The term <italic>W<sub>g</sub></italic> is the learnable projection matrix that maps the contextual representation <italic>c<sub>t</sub></italic> into a gating score, while <italic>β</italic> amplifies the gate when the intermediate prediction <inline-formula><tex-math id="M1">$$ \hat{y} $$</tex-math></inline-formula><italic><sub>t</sub></italic><sub>+1</sub><italic><sup>raw</sup></italic> exceeds the previous value <italic>y<sub>t</sub></italic>. The indicator function [<inline-formula><tex-math id="M1">$$ \hat{y} $$</tex-math></inline-formula><italic><sub>t</sub></italic><sub>+1</sub><italic><sup>raw</sup></italic> &gt; <italic>y<sub>t</sub></italic>] triggers this adjustment. The final prediction <inline-formula><tex-math id="M1">$$ \hat{y} $$</tex-math></inline-formula><italic><sub>t</sub></italic><sub>+1</sub> is thus obtained as a gated fusion of the monotonic and raw branches, ensuring full physical consistency.</p>
        <p>The MDH module integrates three types of inputs: the contextual representation at the current step, local trend information, and the previous capacity value. It outputs the predicted capacity change Δ, which is strictly non-negative. A relative upper bound constraint is applied to Δ, ensuring that the decrease does not exceed a certain ratio of the previous capacity. The final predicted capacity is then obtained by <inline-formula><tex-math id="M1">$$ \hat{y} $$</tex-math></inline-formula><italic><sub>t</sub></italic><sub>+1</sub> = <italic>y<sub>t</sub></italic> - Δ, guaranteeing monotonic degradation over time.</p>
        <p>Additionally, the MDH is fused with the main prediction branch (original regression head) through an adaptive gating mechanism. When the main prediction violates physical constraints (i.e., the predicted capacity exceeds the previous value), the gate value increases, assigning higher weight to the physically consistent branch. When the prediction follows the physical rule, the main branch dominates. This adaptive fusion achieves a balance between physical consistency and model flexibility.</p>
        <p>Practical note. In real-world battery operation, apparent local capacity recovery can be observed due to relaxation phenomena, temperature changes, and measurement noise. The proposed MDH is intended to improve long-horizon trend consistency and suppress non-physical upward oscillations in predictions, rather than to explicitly model reversible short-term behaviors. Therefore, strict monotonic enforcement may reduce flexibility in scenarios dominated by recovery effects, particularly in early-life stages. Exploring soft/uncertainty-aware monotonic constraints is an important direction for future work.</p>
      </sec>
    </sec>
    <sec id="sec3">
      <title>3. EXPERIMENTS</title>
      <sec id="sec3-1">
        <title>3.1. Dataset</title>
        <p>This study uses the National Aeronautics and Space Administration (NASA) battery dataset as the primary benchmark and introduces the TJU dataset to evaluate the generalization capability of the proposed model under multivariable conditions<sup>[<xref ref-type="bibr" rid="B32">32</xref>]</sup>. The dataset, provided by NASA, contains full discharge cycle data for four lithium-ion batteries (B0005, B0006, B0007, and B0018) under constant operating conditions. The core variable is the trajectory of capacity degradation with respect to cycle count, which has become one of the most widely used benchmark datasets for RUL prediction. To simulate practical rolling prediction scenarios, the capacity sequences were truncated at different starting points (SP = 50, 70, and 90) to initialize the prediction process. These settings cover both the early and rapid degradation stages, enabling evaluation of model stability and robustness under different observation windows.</p>
        <p>In contrast, the TJU dataset, proposed by Tongji University and collaborators, provides more complex cycling information. In addition to capacity, it includes multiple statistical features of voltage and current during constant current (CC) and constant voltage (CV) stages, such as mean, variance, kurtosis, skewness, slope, and entropy. Incorporating the TJU dataset serves two purposes: first, to demonstrate that the proposed model maintains strong predictive performance in high-dimensional feature spaces; and second, to verify its generalization capability across datasets. For consistency, the TJU dataset was evaluated at starting points SP = 200, 300, and 400, allowing assessment of prediction behavior over longer historical cycles.</p>
        <p>Notably, although the NASA dataset is essentially univariate, the input sequence is first projected into a higher-dimensional latent space before being processed by CGHF. Therefore, multi-scale feature extraction is still performed across latent channels. Nevertheless, the full advantage of CGHF is more evident in multivariate scenarios, which is further validated using the TJU dataset.</p>
        <p>
          <xref ref-type="fig" rid="fig5">Figure 5</xref> illustrates the capacity degradation curves of the two datasets, while <xref ref-type="table" rid="t1">Table 1</xref> lists the basic specifications of the cells, including model type, rated capacity, charge–discharge protocol, and temperature conditions.</p>
        <fig id="fig5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>(A) NASA dataset and (B) TJU dataset: capacity degradation curves of lithium-ion batteries in both datasets. NASA: National Aeronautics and Space Administration; TJU: Tongji University.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6015.fig.5.jpg" />
        </fig>
        <table-wrap id="t1">
          <label>Table 1</label>
          <caption>
            <p>Battery parameter information of the NASA and TJU datasets</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Source</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>ID</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Charge/discharge cut-off voltage</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Charge/discharge CC</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Temperature</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Rated capacity</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>End-of-Life criteria</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td rowspan="4">NASA</td>
                <td>B0005</td>
                <td>4.2 V / 2.7 V</td>
                <td>1.5 A / 2 A</td>
                <td>24 °C</td>
                <td>2 Ah</td>
                <td>1.4 Ah</td>
              </tr>
              <tr>
                <td>B0006</td>
                <td>4.2 V / 2.5 V</td>
                <td>1.5 A / 2 A</td>
                <td>24 °C</td>
                <td>2 Ah</td>
                <td>1.4 Ah</td>
              </tr>
              <tr>
                <td>B0007</td>
                <td>4.2 V / 2.2 V</td>
                <td>1.5 A / 2 A</td>
                <td>24 °C</td>
                <td>2 Ah</td>
                <td>1.4 Ah</td>
              </tr>
              <tr>
                <td>B0018</td>
                <td>4.2 V / 2.5 V</td>
                <td>1.5 A / 2 A</td>
                <td>24 °C</td>
                <td>2 Ah</td>
                <td>1.4 Ah</td>
              </tr>
              <tr>
                <td rowspan="3">TJU</td>
                <td>CY25_1</td>
                <td>4.2 V / 2.5 V</td>
                <td>1.25 A / 2.5 A</td>
                <td>25 °C</td>
                <td>2.5 Ah</td>
                <td>1.75 Ah</td>
              </tr>
              <tr>
                <td>CY25_2</td>
                <td>4.2 V / 2.5 V</td>
                <td>1.25 A / 2.5 A</td>
                <td>25 °C</td>
                <td>2.5 Ah</td>
                <td>1.75 Ah</td>
              </tr>
              <tr>
                <td>CY25_4</td>
                <td>4.2 V / 2.5 V</td>
                <td>1.25 A / 2.5 A</td>
                <td>25 °C</td>
                <td>2.5 Ah</td>
                <td>1.75 Ah</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>NASA: National Aeronautics and Space Administration; TJU: Tongji University; CC: constant current.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec id="sec3-2">
        <title>3.2. Data cleaning and feature construction</title>
        <p>For the NASA dataset, the raw records contain missing cycles and local abnormal fluctuations; therefore, a two-step correction strategy is adopted. Initially, the entire cycle range from 1 to the maximum is completed, and missing capacity values are reconstructed by linear interpolation. Subsequently, outliers are detected using the 2σ criterion and masked, followed by another linear interpolation to smooth the capacity trajectory. The resulting capacity curve becomes smoother and exhibits an approximately monotonic decline, which is consistent with the overall irreversible degradation trend of lithium-ion batteries under controlled cycling.</p>
        <p>Notably, the above interpolation and sigma-based masking are mainly used to handle missing cycles and apparent outliers in the NASA records, rather than to remove realistic short-term recovery behaviors. This preprocessing results in a smoother and approximately monotonic trajectory, which may attenuate local capacity recovery caused by relaxation or measurement noise. Accordingly, the current benchmark setting may not fully reflect reversible short-term behaviors, and we regard evaluation on raw (non-monotonized) trajectories under broader operating conditions as an important direction for future work.</p>
        <p>For the TJU dataset, the 3σ rule is applied to all numerical feature columns, removing rows where values exceed three standard deviations from the mean. The cycle indices are then renumbered to ensure sequence continuity. In the feature selection stage, 17 health-related statistical features are retained, including the mean, standard deviation, kurtosis, skewness, slope, and entropy of voltage and current during the CC and CV phases, as well as charging time and capacity. Compared with the univariate NASA dataset, the multidimensional TJU features provide a more comprehensive description of the degradation process, supporting verification of the model’s variable selection and channel attention mechanisms.</p>
      </sec>
      <sec id="sec3-3">
        <title>3.3. Data partitioning</title>
        <p>As shown in <xref ref-type="table" rid="t2">Table 2</xref>, all data are divided into two parts: a training set and a test set. Within the training data, the first 80% of cycles in chronological order are used for model training, and the remaining 20% are used for validation to monitor early stopping and select hyperparameters. For the NASA dataset, which serves as the main experimental benchmark, the full-cycle data from batteries B0006, B0007, and B0018 are used for training, while B0005 is reserved as an independent test sample to evaluate cross-cell generalization and rolling prediction performance at different starting points (SP). For the TJU dataset, which tests generalization in a multivariable feature space, CY25_2 and CY25_4 are merged as the training set, and CY25_1 is used for testing.</p>
        <table-wrap id="t2">
          <label>Table 2</label>
          <caption>
            <p>Partitioning of the NASA and TJU datasets</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Dataset</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Training dataset</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Test dataset</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>NASA</td>
                <td>B0006 B0007 B0018</td>
                <td>B0005</td>
              </tr>
              <tr>
                <td>TJU</td>
                <td>CY25_2 CY25_4</td>
                <td>CY25_1</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>NASA: National Aeronautics and Space Administration; TJU: Tongji University.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>During testing, evaluation begins at the predefined starting points for each dataset (NASA: 50/70/90; TJU: 200/300/400). To strictly prevent data leakage, all normalization parameters are computed exclusively from the training set and then fixed for use in validation and testing. This setup ensures independence under cross-battery conditions and maintains consistency in constructing multi-start and single-step prediction windows, facilitating fair comparisons between datasets and reproducibility of experiments.</p>
      </sec>
      <sec id="sec3-4">
        <title>3.4. Overall architecture</title>
        <p>The model architecture consists of four main components, and the overall framework is shown in <xref ref-type="fig" rid="fig6">Figure 6</xref>.</p>
        <fig id="fig6" position="float" width="450">
          <label>Figure 6</label>
          <caption>
            <p>Overall architecture of the proposed CGHF-MDH-Mamba model. CGHF: Channel-grouping half-convolution; MDH: monotonic decreasing head.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6015.fig.6.jpg" />
        </fig>
        <p>First, CGHF operates at the channel level to compress redundant feature maps and enhance local temporal patterns with lightweight grouped half-convolution and channel attention before sequence modeling. Second, VSN operates at the variable level to assign adaptive importance weights across heterogeneous input variables, improving feature saliency and interpretability in multivariate settings. In this sense, CGHF and VSN play complementary roles: the former suppresses intra-channel redundancy, while the latter reduces inter-variable redundancy. Third, the Mamba sequence modeling module captures long-range dependencies and fuses local and global contextual information to better represent complex degradation patterns after feature refinement. Finally, an MDH imposes a physical constraint that forces the predicted capacity to decrease monotonically with cycles, ensuring consistency with electrochemical degradation laws. These modules operate in a complementary manner to improve multivariate degradation modeling, prediction consistency, and generalization capability.</p>
      </sec>
    </sec>
    <sec id="sec4">
      <title>4. RESULTS AND DISCUSSION</title>
      <sec id="sec4-1">
        <title>4.1. Experimental environment</title>
        <p>The experiments were conducted on an Ubuntu 22.04 operating system using the PyTorch deep learning framework. The detailed hardware and software configurations are listed in <xref ref-type="table" rid="t3">Table 3</xref>.</p>
        <table-wrap id="t3">
          <label>Table 3</label>
          <caption>
            <p>Experimental environment configuration</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Item</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Configuration information</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>Operating system</td>
                <td>Ubuntu 22.04</td>
              </tr>
              <tr>
                <td>Development language</td>
                <td>Python 3.10.13</td>
              </tr>
              <tr>
                <td>Framework</td>
                <td>PyTorch 1.13.1 + CUDA 11.7</td>
              </tr>
              <tr>
                <td>CPU</td>
                <td>Intel(R) Core(TM) i5-14600KF</td>
              </tr>
              <tr>
                <td>GPU</td>
                <td>GeForce RTX 4070 Ti SUPER (16 GB)</td>
              </tr>
              <tr>
                <td>Memory</td>
                <td>64 GB</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>CPU: Central Processing Unit; GPU: Graphics Processing Unit.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>During training, the AdamW optimizer was used with a learning rate of 1 × 10<sup>-3</sup>, a batch size of 128, and a maximum of 1,000 epochs. An early stopping strategy was applied to prevent overfitting. The sequence length was set to 64, and the prediction step was set to 1. All hyperparameters were tuned based on validation performance to ensure fairness and reproducibility of the experimental results.</p>
      </sec>
      <sec id="sec4-2">
        <title>4.2. Evaluation metrics</title>
        <p>In this study, five evaluation metrics are used to assess the prediction performance of the model at each starting point (SP): mean absolute error (MAE), root mean square error (RMSE), coefficient of determination (R<sup>2</sup>), absolute error (AE), and relative error (RE). The definitions and corresponding formulas for these metrics are summarized in <xref ref-type="table" rid="t4">Table 4</xref>. MAE and RMSE are calculated on the predicted battery capacity values and are reported in Ah. AE is reported in cycles, whereas R<sup>2</sup> and RE are dimensionless.</p>
        <table-wrap id="t4">
          <label>Table 4</label>
          <caption>
            <p>Evaluation indicators</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Evaluation metrics</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Formula</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Significance</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>MAE (Ah)</td>
                <td><inline-formula><tex-math id="M1">$$ MAE
=
\frac{1}{N}
\sum_{i=1}^{N}
\left|
y_i-\hat{y}_i
\right| $$</tex-math></inline-formula></td>
                <td>The absolute value of the error between the predicted and true values is averaged. Value range: ≥ 0, the smaller the better</td>
              </tr>
              <tr>
                <td>RMSE (Ah)</td>
                <td><inline-formula><tex-math id="M1">$$ RMSE
=
\sqrt{
\frac{1}{N}
\sum_{i=1}^{N}
\left(
y_i-\hat{y}_i
\right)^2
} $$</tex-math></inline-formula></td>
                <td>Similar to MAE, but more sensitive to “points with large deviations”. Value range: ≥ 0, the smaller the better</td>
              </tr>
              <tr>
                <td>R<sup>2</sup></td>
                <td><inline-formula><tex-math id="M1">$$ R^2
=
1-
\frac{
\sum
\left(
y_i-\hat{y}_i
\right)^2
}{
\sum
\left(
y_i-\bar{y}
\right)^2
} $$</tex-math></inline-formula></td>
                <td>Measures the degree to which the predicted values explain the true values. Value range: (−∞, 1]; the closer to 1, the better</td>
              </tr>
              <tr>
                <td>AE (for RUL, cycles)</td>
                <td><inline-formula><tex-math id="M1">$$ AE
=
\left|
RUL_{true}
-
RUL_{pred}
\right| $$</tex-math></inline-formula></td>
                <td>The absolute difference between the predicted RUL (number of remaining cycles) and the true RUL. Value range: ≥ 0, the smaller the better</td>
              </tr>
              <tr>
                <td>RE (for RUL)</td>
                <td><inline-formula><tex-math id="M1">$$ RE
=
\frac{
\left|
RUL_{true}
-
RUL_{pred}
\right|
}{
RUL_{true}
} $$</tex-math></inline-formula></td>
                <td>The ratio of the absolute RUL prediction error to the true RUL. Value range: ≥ 0, the smaller the better</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>MAE: Mean absolute error; RMSE: root mean square error; R<sup>2</sup>: coefficient of determination; AE: absolute error; RUL: remaining useful life; RE: relative error.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec id="sec4-3">
        <title>4.3. Comparative experiments</title>
        <p>To comprehensively evaluate the performance of the proposed model, comparative experiments were conducted on both the NASA and TJU battery datasets.</p>
        <p>For the NASA dataset, which primarily consists of univariate sequences describing capacity degradation over cycles, the experiments focused on evaluating the model’s RUL prediction capability based on a single health indicator. As shown in <xref ref-type="fig" rid="fig7">Figure 7</xref> and <xref ref-type="table" rid="t5">Table 5</xref>, other deep learning models—such as Autoformer, FEDformer, and PatchTST—can partially capture the degradation trend but exhibit larger errors across different starting points (SP = 50, 70, and 90). In contrast, the RUL-Mamba model achieves lower prediction errors, benefiting from the ability of the state-space recurrence mechanism to model long-term dependencies. The proposed CGHF-MDH-Mamba model further improves prediction accuracy, achieving a minimum MAE of 0.0081. These results indicate that the integration of channel half-convolution and monotonic constraints improves prediction stability and maintains competitive performance in univariate scenarios.</p>
        <fig id="fig7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Comparison between predicted and measured battery capacity trajectories on the NASA dataset under different prediction starting points. Comparison curve between predicted value and true value when (A) SP = 50; (B) SP = 70; (C) SP = 90. NASA: National Aeronautics and Space Administration; SP: starting point.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6015.fig.7.jpg" />
        </fig>
        <table-wrap id="t5">
          <label>Table 5</label>
          <caption>
            <p>RUL prediction results of different models on NASA dataset</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Dataset</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Method</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>SP</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>TRUL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PRUL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>MAE (Ah)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>RMSE (Ah)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>R<sup>2</sup></bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>AE (cycles)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>RE</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td rowspan="27">NASA</td>
                <td rowspan="3">Autoformer</td>
                <td>50</td>
                <td>75</td>
                <td>74.8</td>
                <td>0.0234</td>
                <td>0.0336</td>
                <td>0.9341</td>
                <td>3.6</td>
                <td>0.0486</td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>52.3</td>
                <td>0.0230</td>
                <td>0.0340</td>
                <td>0.8721</td>
                <td>4.1</td>
                <td>0.0759</td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>32.8</td>
                <td>0.0213</td>
                <td>0.0313</td>
                <td>0.8153</td>
                <td>4.2</td>
                <td>0.1235</td>
              </tr>
              <tr>
                <td rowspan="3">FEDformer</td>
                <td>50</td>
                <td>75</td>
                <td>74.9</td>
                <td>0.0215</td>
                <td>0.0266</td>
                <td>0.9569</td>
                <td>4.7</td>
                <td>0.0635</td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>53.6</td>
                <td>0.0199</td>
                <td>0.0262</td>
                <td>0.9217</td>
                <td>5.0</td>
                <td>0.0926</td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>32.6</td>
                <td>0.0172</td>
                <td>0.0237</td>
                <td>0.8961</td>
                <td>5.8</td>
                <td>0.1706</td>
              </tr>
              <tr>
                <td rowspan="3">PathFormer</td>
                <td>50</td>
                <td>75</td>
                <td>70.3</td>
                <td>0.0274</td>
                <td>0.0375</td>
                <td>0.9228</td>
                <td>5.1</td>
                <td>0.0689</td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>50.0</td>
                <td>0.0214</td>
                <td>0.0292</td>
                <td>0.9100</td>
                <td>5.6</td>
                <td>0.1037</td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>27.1</td>
                <td>0.0186</td>
                <td>0.0248</td>
                <td>0.8941</td>
                <td>7.9</td>
                <td>0.2324</td>
              </tr>
              <tr>
                <td rowspan="3">TimesNet</td>
                <td>50</td>
                <td>75</td>
                <td>78.0</td>
                <td>0.0364</td>
                <td>0.0478</td>
                <td>0.8753</td>
                <td>3.0</td>
                <td>0.0405</td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>57.9</td>
                <td>0.0298</td>
                <td>0.0403</td>
                <td>0.8349</td>
                <td>2.9</td>
                <td>0.0537</td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>38.0</td>
                <td>0.0213</td>
                <td>0.0275</td>
                <td>0.8699</td>
                <td>3.0</td>
                <td>0.0882</td>
              </tr>
              <tr>
                <td rowspan="3">TimeMixer</td>
                <td>50</td>
                <td>75</td>
                <td>79.8</td>
                <td>0.0239</td>
                <td>0.0285</td>
                <td>0.9540</td>
                <td>8.0</td>
                <td>0.1081</td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>52.7</td>
                <td>0.0241</td>
                <td>0.0298</td>
                <td>0.9014</td>
                <td>6.7</td>
                <td>0.1241</td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>26.0</td>
                <td>0.0203</td>
                <td>0.0307</td>
                <td>0.8290</td>
                <td>9.0</td>
                <td>0.2647</td>
              </tr>
              <tr>
                <td rowspan="3">PatchTST</td>
                <td>50</td>
                <td>75</td>
                <td>79.2</td>
                <td>0.0260</td>
                <td>0.0319</td>
                <td>0.9405</td>
                <td>4.2</td>
                <td>0.0568</td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>56.7</td>
                <td>0.0201</td>
                <td>0.0250</td>
                <td>0.9333</td>
                <td>3.9</td>
                <td>0.0722</td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>30.4</td>
                <td>0.0150</td>
                <td>0.0212</td>
                <td>0.9209</td>
                <td>5.0</td>
                <td>0.1471</td>
              </tr>
              <tr>
                <td rowspan="3">MambaLithium</td>
                <td>50</td>
                <td>75</td>
                <td>81.7</td>
                <td>0.0301</td>
                <td>0.0362</td>
                <td>0.9254</td>
                <td>6.7</td>
                <td>0.0905</td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>60.7</td>
                <td>0.0250</td>
                <td>0.0305</td>
                <td>0.9034</td>
                <td>5.7</td>
                <td>0.1056</td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>32.9</td>
                <td>0.0188</td>
                <td>0.0244</td>
                <td>0.8943</td>
                <td>4.1</td>
                <td>0.1206</td>
              </tr>
              <tr>
                <td rowspan="3">RUL-Mamba</td>
                <td>50</td>
                <td>75</td>
                <td>75.8</td>
                <td>0.0083</td>
                <td>0.0134</td>
                <td>
                  <bold>0.9901</bold>
                </td>
                <td>
                  <bold>0.8</bold>
                </td>
                <td>0.0135</td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>55.9</td>
                <td>0.0091</td>
                <td>0.0150</td>
                <td>0.9770</td>
                <td>
                  <bold>0.9</bold>
                </td>
                <td>
                  <bold>0.0167</bold>
                </td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>34.5</td>
                <td>0.0092</td>
                <td>0.0161</td>
                <td>0.9556</td>
                <td>2.5</td>
                <td>0.0735</td>
              </tr>
              <tr>
                <td rowspan="3">Ours</td>
                <td>50</td>
                <td>75</td>
                <td>76</td>
                <td>
                  <bold>0.0081</bold>
                </td>
                <td>
                  <bold>0.0132</bold>
                </td>
                <td>0.9848</td>
                <td>1.0</td>
                <td>
                  <bold>0.0133</bold>
                </td>
              </tr>
              <tr>
                <td>70</td>
                <td>55</td>
                <td>56</td>
                <td>
                  <bold>0.0082</bold>
                </td>
                <td>
                  <bold>0.0135</bold>
                </td>
                <td>
                  <bold>0.9816</bold>
                </td>
                <td>1.0</td>
                <td>0.0182</td>
              </tr>
              <tr>
                <td>90</td>
                <td>35</td>
                <td>36</td>
                <td>
                  <bold>0.0085</bold>
                </td>
                <td>
                  <bold>0.0144</bold>
                </td>
                <td><bold>0.9640</bold></td>
                <td><bold>1.0</bold></td>
                <td>
                  <bold>0.0286</bold>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Bold values indicate the best result for each metric at each SP. RUL: Remaining useful life; NASA: National Aeronautics and Space Administration; SP: starting point of prediction; TRUL: average value of true RUL; PRUL: average value of predicted RUL; MAE: mean absolute error; RMSE: root mean square error; R<sup>2</sup>: coefficient of determination; AE: average absolute error of 10 experiments; RE: relative error.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>For the TJU dataset, which includes multivariate health indicators such as voltage and current statistics across different charge–discharge phases, the experiments focused on evaluating multivariate time-series prediction performance. As shown in <xref ref-type="fig" rid="fig8">Figure 8</xref> and <xref ref-type="table" rid="t6">Table 6</xref>, conventional Transformer-based models achieved relatively good fitting performance but still suffered from inconsistencies and higher errors across starting points. In contrast, the RUL-Mamba model effectively exploited temporal dependencies among variables, producing very low prediction errors. Building on this, the proposed CGHF-MDH-Mamba model achieved further improvement, reducing the MAE to 0.0009 and yielding an RUL deviation of only one cycle from the ground truth. These results indicate that, in complex multivariate conditions, the CGHF’s redundant feature compression and MDH’s trend constraint mechanisms significantly enhance generalization capability.</p>
        <fig id="fig8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Comparison between predicted and measured battery capacity trajectories on the TJU dataset under different prediction starting points. Comparison curves between predicted and true values when (A) SP = 200; (B) SP = 300; (C) SP = 400. TJU: Tongji University; SP: starting point.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6015.fig.8.jpg" />
        </fig>
        <table-wrap id="t6">
          <label>Table 6</label>
          <caption>
            <p>RUL prediction results of different models with multivariate inputs on TJU dataset</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Dataset</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Method</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>SP</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>TRUL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PRUL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>MAE (Ah)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>RMSE (Ah)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>R<sup>2</sup></bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>AE (cycles)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>RE</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td rowspan="27">TJU</td>
                <td rowspan="3">Autoformer</td>
                <td>200</td>
                <td>579</td>
                <td>580.4</td>
                <td>0.0020</td>
                <td>0.0028</td>
                <td>0.9997</td>
                <td>1.6</td>
                <td>0.0028</td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>478.6</td>
                <td>0.0031</td>
                <td>0.0042</td>
                <td>0.9989</td>
                <td>3.2</td>
                <td>0.0067</td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>376.6</td>
                <td>0.0038</td>
                <td>0.0051</td>
                <td>0.9975</td>
                <td>4.4</td>
                <td>0.0116</td>
              </tr>
              <tr>
                <td rowspan="3">FEDformer</td>
                <td>200</td>
                <td>579</td>
                <td>581.2</td>
                <td>0.0020</td>
                <td>0.0028</td>
                <td>0.9997</td>
                <td>2.2</td>
                <td>0.0038</td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>481.5</td>
                <td>0.0030</td>
                <td>0.0039</td>
                <td>0.9990</td>
                <td>2.5</td>
                <td>0.0052</td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>380.2</td>
                <td>0.0034</td>
                <td>0.0045</td>
                <td>0.9980</td>
                <td>3.2</td>
                <td>0.0085</td>
              </tr>
              <tr>
                <td rowspan="3">PathFormer</td>
                <td>200</td>
                <td>579</td>
                <td>569.2</td>
                <td>0.0093</td>
                <td>0.0123</td>
                <td>0.9938</td>
                <td>9.8</td>
                <td>0.0170</td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>467.4</td>
                <td>0.0105</td>
                <td>0.0148</td>
                <td>0.9868</td>
                <td>11.6</td>
                <td>0.0243</td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>364.4</td>
                <td>0.0144</td>
                <td>0.0199</td>
                <td>0.9641</td>
                <td>14.6</td>
                <td>0.0386</td>
              </tr>
              <tr>
                <td rowspan="3">TimesNet</td>
                <td>200</td>
                <td>579</td>
                <td>580.0</td>
                <td>0.0161</td>
                <td>0.0202</td>
                <td>0.9832</td>
                <td>1.0</td>
                <td>0.0017</td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>479.1</td>
                <td>0.0145</td>
                <td>0.0177</td>
                <td>0.9812</td>
                <td><bold>0.1</bold></td>
                <td><bold>0.0002</bold></td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>378.3</td>
                <td>0.0129</td>
                <td>0.0154</td>
                <td>0.9787</td>
                <td><bold>0.7</bold></td>
                <td><bold>0.0019</bold></td>
              </tr>
              <tr>
                <td rowspan="3">TimeMixer</td>
                <td>200</td>
                <td>579</td>
                <td>582.2</td>
                <td>0.0120</td>
                <td>0.0147</td>
                <td>0.9900</td>
                <td>12.0</td>
                <td>0.0208</td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>456.3</td>
                <td>0.0195</td>
                <td>0.0236</td>
                <td>0.9630</td>
                <td>35.1</td>
                <td>0.0734</td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>334.4</td>
                <td>0.0271</td>
                <td>0.0308</td>
                <td>0.8992</td>
                <td>51.4</td>
                <td>0.1360</td>
              </tr>
              <tr>
                <td rowspan="3">PatchTST</td>
                <td>200</td>
                <td>579</td>
                <td>574.8</td>
                <td>0.0087</td>
                <td>0.0113</td>
                <td>0.9947</td>
                <td>8.8</td>
                <td>0.0152</td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>456.6</td>
                <td>0.0206</td>
                <td>0.0233</td>
                <td>0.9640</td>
                <td>22.8</td>
                <td>0.0477</td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>334.9</td>
                <td>0.0326</td>
                <td>0.0347</td>
                <td>0.8740</td>
                <td>44.1</td>
                <td>0.1167</td>
              </tr>
              <tr>
                <td rowspan="3">MambaLithium</td>
                <td>200</td>
                <td>579</td>
                <td>580.9</td>
                <td>0.0064</td>
                <td>0.0082</td>
                <td>0.9970</td>
                <td>4.7</td>
                <td>0.0081</td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>472.3</td>
                <td>0.0088</td>
                <td>0.0110</td>
                <td>0.9919</td>
                <td>6.7</td>
                <td>0.0140</td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>354.3</td>
                <td>0.0178</td>
                <td>0.0197</td>
                <td>0.9631</td>
                <td>24.7</td>
                <td>0.0653</td>
              </tr>
              <tr>
                <td rowspan="3">RUL-Mamba</td>
                <td>200</td>
                <td>579</td>
                <td>581.6</td>
                <td>0.0014</td>
                <td>0.0022</td>
                <td>0.9998</td>
                <td>2.6</td>
                <td>0.0045</td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>481.6</td>
                <td>0.0015</td>
                <td>0.0023</td>
                <td>0.9997</td>
                <td>2.6</td>
                <td>0.0054</td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>381.6</td>
                <td>0.0016</td>
                <td>0.0024</td>
                <td>0.9995</td>
                <td>2.6</td>
                <td>0.0069</td>
              </tr>
              <tr>
                <td rowspan="3">Ours</td>
                <td>200</td>
                <td>579</td>
                <td>580.0</td>
                <td><bold>0.0009</bold></td>
                <td><bold>0.0015</bold></td>
                <td><bold>0.9999</bold></td>
                <td><bold>1.0</bold></td>
                <td><bold>0.0017</bold></td>
              </tr>
              <tr>
                <td>300</td>
                <td>479</td>
                <td>480.0</td>
                <td><bold>0.0010</bold></td>
                <td><bold>0.0016</bold></td>
                <td><bold>0.9999</bold></td>
                <td>1.0</td>
                <td>0.0021</td>
              </tr>
              <tr>
                <td>400</td>
                <td>379</td>
                <td>380.0</td>
                <td><bold>0.0010</bold></td>
                <td><bold>0.0016</bold></td>
                <td><bold>0.9998</bold></td>
                <td>1.0</td>
                <td>0.0026</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Bold values indicate the best result for each metric at each SP. RUL: Remaining useful life; TJU: Tongji University; SP: starting point of prediction; TRUL: average value of true RUL; PRUL: average value of predicted RUL; MAE: mean absolute error; RMSE: root mean square error; R<sup>2</sup>: coefficient of determination; AE: average absolute error of 10 experiments; RE: relative error.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Overall, the experimental results demonstrate that, for univariate input scenarios (NASA dataset), the RUL-Mamba model already exhibits strong prediction capability, while the proposed model further improves both prediction accuracy and physical consistency. For multivariate input scenarios (TJU dataset), the inclusion of CGHF and MDH modules significantly enhances the model’s ability to select and represent multidimensional degradation features, achieving the lowest MAE and RMSE and the highest R<sup>2</sup> across all starting points. These findings confirm that the CGHF-MDH-Mamba model maintains strong adaptability and generalization under various data characteristics and operating conditions.</p>
      </sec>
      <sec id="sec4-4">
        <title>4.4. Ablation study</title>
        <p>To quantify the contribution of each module to the performance improvement of the proposed battery RUL prediction model, a systematic ablation study was conducted. The experiments were performed on the TJU dataset by progressively integrating different modules. Starting from the baseline model, the MDH, fusion, VSN, and CGHF modules were added one by one until the complete model was obtained, and the results at each stage were compared. The detailed results are shown in <xref ref-type="table" rid="t7">Table 7</xref>.</p>
        <table-wrap id="t7">
          <label>Table 7</label>
          <caption>
            <p>Comparison of ablation experiment results</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Method</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>SP</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>MAE (Ah)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>RMSE (Ah)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>R<sup>2</sup></bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>AE (cycles)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>RE</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Inference time/s</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td rowspan="3">Base model</td>
                <td>200</td>
                <td>0.0014</td>
                <td>0.0022</td>
                <td>0.9998</td>
                <td>2.6</td>
                <td>0.0045</td>
                <td>0.203</td>
              </tr>
              <tr>
                <td>300</td>
                <td>0.0015</td>
                <td>0.0023</td>
                <td>0.9997</td>
                <td>2.6</td>
                <td>0.0054</td>
                <td>0.152</td>
              </tr>
              <tr>
                <td>400</td>
                <td>0.0016</td>
                <td>0.0024</td>
                <td>0.9995</td>
                <td>2.6</td>
                <td>0.0069</td>
                <td>0.126</td>
              </tr>
              <tr>
                <td rowspan="3">Base model + MDH</td>
                <td>200</td>
                <td>0.0018</td>
                <td>0.0021</td>
                <td>0.9998</td>
                <td>1.4</td>
                <td>0.0024</td>
                <td>0.171</td>
              </tr>
              <tr>
                <td>300</td>
                <td>0.0018</td>
                <td>0.0022</td>
                <td>0.9997</td>
                <td>1.4</td>
                <td>0.0029</td>
                <td>0.128</td>
              </tr>
              <tr>
                <td>400</td>
                <td>0.0018</td>
                <td>0.0022</td>
                <td>0.9995</td>
                <td>1.4</td>
                <td>0.0037</td>
                <td>0.110</td>
              </tr>
              <tr>
                <td rowspan="3">Base model + fusion + MDH</td>
                <td>200</td>
                <td>0.0016</td>
                <td>0.0020</td>
                <td>0.9998</td>
                <td>1.2</td>
                <td>0.0021</td>
                <td>0.166</td>
              </tr>
              <tr>
                <td>300</td>
                <td>0.0016</td>
                <td>0.0020</td>
                <td>0.9998</td>
                <td>1.2</td>
                <td>0.0025</td>
                <td>0.127</td>
              </tr>
              <tr>
                <td>400</td>
                <td>0.0016</td>
                <td>0.0020</td>
                <td>0.9996</td>
                <td>1.2</td>
                <td>0.0032</td>
                <td>0.105</td>
              </tr>
              <tr>
                <td rowspan="3">Base model + VSN + fusion + MDH</td>
                <td>200</td>
                <td>0.0012</td>
                <td>0.0016</td>
                <td>0.9999</td>
                <td>1.0</td>
                <td>0.0017</td>
                <td>0.177</td>
              </tr>
              <tr>
                <td>300</td>
                <td>0.0012</td>
                <td>0.0017</td>
                <td>0.9998</td>
                <td>1.0</td>
                <td>0.0021</td>
                <td>0.129</td>
              </tr>
              <tr>
                <td>400</td>
                <td>0.0012</td>
                <td>0.0017</td>
                <td>0.9997</td>
                <td>1.0</td>
                <td>0.0026</td>
                <td>0.105</td>
              </tr>
              <tr>
                <td rowspan="3">Base model + CGHF + VSN + fusion + MDH</td>
                <td>200</td>
                <td>0.0009</td>
                <td>0.0015</td>
                <td>0.9999</td>
                <td>1.0</td>
                <td>0.0017</td>
                <td>0.167</td>
              </tr>
              <tr>
                <td>300</td>
                <td>0.0010</td>
                <td>0.0016</td>
                <td>0.9999</td>
                <td>1.0</td>
                <td>0.0021</td>
                <td>0.119</td>
              </tr>
              <tr>
                <td>400</td>
                <td>0.0010</td>
                <td>0.0016</td>
                <td>0.9998</td>
                <td>1.0</td>
                <td>0.0026</td>
                <td>0.102</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>SP: Starting point; MAE: mean absolute error; RMSE: root mean square error; R<sup>2</sup>: coefficient of determination; AE: absolute error; RE: relative error; MDH: monotonic decreasing head; VSN: variable selection network; CGHF: channel-grouping half-convolution.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>As observed from the results, the baseline model already achieved reasonably stable prediction performance in terms of MAE and RMSE, but the AE in RUL estimation remained relatively high. After introducing the MDH module, RMSE improved slightly and MAE increased marginally (from 0.0014–0.0016 to 0.0018), while AE dropped significantly from 2.6 to 1.4 cycles. This indicates that MDH enhances the consistency between predicted and actual RUL values and enforces the physical law of monotonic capacity degradation.</p>
        <p>When the fusion gating mechanism was added on top of the Base model + MDH structure, the model combined local and global contextual representations, improving the smoothness and stability of the predicted curves. The approach reduces fluctuations caused by overreliance on instantaneous features. On this basis, incorporating the VSN module led to a more substantial improvement: MAE dropped to 0.0012. This demonstrates that the VSN effectively suppresses noisy features and emphasizes key signals sensitive to degradation trends, thereby enhancing both prediction accuracy and interpretability in multivariable input scenarios.</p>
        <p>Overall, after adding the CGHF module, the model achieved the best performance across all three starting points, with the lowest MAE reaching 0.0009, RMSE remaining around 0.0015, and AE controlled within one cycle. The CGHF module balances local feature extraction and channel residual connection through grouped half-convolution. Assisted by SE attention, it strengthens the response to key channels, making the overall feature representation more compact and effective. Together with the VSN’s sparse variable selection, this ensures strong robustness under high-dimensional feature conditions.</p>
        <p>Moreover, inference efficiency was compared in the ablation experiments. It was found that even after adding multiple modules, the inference time remained within a controllable range and did not exceed that of the base model at any starting point. The complete model maintained inference latency between 0.1 and 0.2 s. This demonstrates that the proposed approach achieves high prediction accuracy without significantly compromising computational efficiency, indicating potential suitability for online monitoring scenarios, subject to further validation under diverse operating conditions.</p>
        <p>Collectively, the ablation results confirm that MDH is indispensable for maintaining physical consistency. The fusion and VSN modules enhance the expressiveness and robustness of temporal features, while CGHF further optimizes local modeling and channel feature selection. These components complement each other, enabling the complete CGHF-MDH-Mamba model to achieve an optimal balance among prediction accuracy, physical interpretability, and inference efficiency.</p>
      </sec>
    </sec>
    <sec id="sec5">
      <title>5. CONCLUSIONS</title>
      <p>This paper proposes a unified framework for lithium-ion battery lifetime prediction that integrates CGHF, VSN, Mamba state-space modeling, and an MDH. Experimental results on the NASA and TJU datasets show that the proposed method provides competitive prediction accuracy while maintaining physical consistency and interpretability, summarized in three aspects as follows:</p>
      <p>(1) Feature modeling: The CGHF and VSN modules contribute to local temporal feature extraction and multivariable sparse selection, respectively, effectively reducing redundancy and emphasizing critical features.</p>
      <p>(2) Sequence modeling: The Mamba module efficiently captures long-range dependencies through a state-space recurrence mechanism, improving the model’s ability to represent full-lifecycle degradation trends.</p>
      <p>(3) Prediction constraint: The MDH module introduces a monotonic decreasing constraint and an adaptive gating mechanism at the output stage, ensuring that the predictions follow electrochemical principles and reducing the deviation between predicted and actual RUL values.</p>
      <p>Nevertheless, this work has several limitations. The datasets used in this study are primarily collected under controlled laboratory conditions, lacking the variability of real-world operating environments such as fluctuating temperatures, dynamic loads, and measurement noise. Although cross-dataset validation partially demonstrates generalization, further evaluation under diverse industrial conditions is necessary. In addition, while the proposed MDH introduces physical constraints that improve robustness, its effectiveness under extreme or highly non-stationary conditions requires further investigation. Future work will focus on large-scale real-world datasets and adaptive modeling strategies for complex operating scenarios.</p>
    </sec>
  </body>
  <back>
    <sec>
      <title>DECLARATIONS</title>
      <sec>
        <title>Authors’ contributions</title>
        <p>Writing - original draft, software, investigation, methodology, validation, data curation: Zhou, X.</p>
        <p>Supervision, conceptualization, writing - review and editing, resources, project administration, funding acquisition: Li, Y.</p>
        <p>Investigation, methodology, visualization: Han, W.</p>
        <p>Formal analysis, software, validation: Zhong, F.</p>
        <p>Data curation, formal analysis, writing - review and editing: Zhang, Z.</p>
        <p>Validation, visualization, resources: Tong, R.</p>
        <p>Conceptualization, methodology, supervision, writing - review and editing: Huang, L.</p>
        <p>All authors have read and agreed to the published version of the manuscript.</p>
      </sec>
      <sec>
        <title>Availability of data and materials</title>
        <p>The original contributions presented in this study are included in the article. Further inquiries can be directed to the corresponding author.</p>
      </sec>
      <sec>
        <title>AI and AI-assisted tools statement</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Financial support and sponsorship</title>
        <p>This research was funded by the Science and Technology Project of Southern Power Grid Company, Research on the Key Technology of Highly Refreshed Digital Twins and Large Depth Cable Detection in Power Conduit Corridors-Subject 1: Research on Key Technology of Highly Refreshed Digital Twins in Power Conduit Corridors (No. 030117KC23110003).</p>
      </sec>
      <sec>
        <title>Conflicts of interest</title>
        <p>Huang, L. serves as an Editorial Board Member of the journal <italic>Intelligence &amp; Robotics</italic>. He was not involved in any steps of editorial processing, notably including reviewers’ selection, manuscript handling, or decision making. Li, Y.; Zhou, X.; Zhong, F.; Han, W.; Zhang, Z.; and Tong, R. are affiliated with Guangzhou Power Supply Bureau of Guangdong Power Grid Co., Ltd.</p>
      </sec>
      <sec>
        <title>Ethical approval and consent to participate</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Consent for publication</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Copyright</title>
        <p>© The Author(s) 2026.</p>
      </sec>
    </sec>
    <ref-list>
      <ref id="B1">
        <label>1</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Gu</surname>
              <given-names>Z</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A novel multiple kernel extreme learning machine model for remaining useful life prediction of lithium-ion batteries</article-title>
          <source>J Power Sources</source>
          <year>2024</year>
          <volume>613</volume>
          <fpage>234912</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jpowsour.2024.234912</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B2">
        <label>2</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>YT</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>LF</given-names>
            </name>
            <name>
              <surname>Su</surname>
              <given-names>XH</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>SB</given-names>
            </name>
          </person-group>
          <article-title>Remaining useful life prediction of lithium-ion batteries based on IMM-PFF</article-title>
          <source>Acta Electron Sin</source>
          <year>2025</year>
          <volume>53</volume>
          <fpage>1520</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.12263/DZXB.20241130</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B3">
        <label>3</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Madani</surname>
              <given-names>SS</given-names>
            </name>
            <name>
              <surname>Shabeer</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Fowler</surname>
              <given-names>M</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Artificial intelligence and digital twin technologies for intelligent lithium-ion battery management systems</article-title>
          <source>Batteries</source>
          <year>2025</year>
          <volume>11</volume>
          <fpage>298</fpage>
          <pub-id pub-id-type="doi">10.3390/batteries11080298</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B4">
        <label>4</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jia</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Ren</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Yun</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Xue</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Mi</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Research on optimization of hybrid energy storage capacity using ensemble empirical mode decomposition and fuzzy control</article-title>
          <source>Acta Energ Sol Sin</source>
          <year>2023</year>
          <volume>44</volume>
          <fpage>239</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.19912/j.0254-0096.tynxb.2021-1070</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B5">
        <label>5</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhu</surname>
              <given-names>ZW</given-names>
            </name>
            <name>
              <surname>Miao</surname>
              <given-names>JW</given-names>
            </name>
            <name>
              <surname>Zhu</surname>
              <given-names>XY</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Research progress in remaining useful life prediction of lithium-ion batteries based on machine learning</article-title>
          <source>Energy Storage Sci Technol</source>
          <year>2024</year>
          <volume>13</volume>
          <fpage>3134</fpage>
          <lpage>49</lpage>
          <pub-id pub-id-type="doi">10.19799/j.cnki.2095-4239.2024.0713</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B6">
        <label>6</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>JF</given-names>
            </name>
            <name>
              <surname>Mo</surname>
              <given-names>WQ</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>XL</given-names>
            </name>
          </person-group>
          <article-title>A review of remaining useful life prediction for lithium-ion batteries based on data-driven method</article-title>
          <source>J Power Supply</source>
          <year>2025</year>
          <volume>23</volume>
          <fpage>253</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.13234/j.issn.2095-2805.2025.7.253</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B7">
        <label>7</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ahwiadi</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A smart evolving fuzzy predictor with customized firefly optimization for battery RUL prediction</article-title>
          <source>Batteries</source>
          <year>2025</year>
          <volume>11</volume>
          <fpage>362</fpage>
          <pub-id pub-id-type="doi">10.3390/batteries11100362</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B8">
        <label>8</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Demirci</surname>
              <given-names>O</given-names>
            </name>
            <name>
              <surname>Taskin</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Schaltz</surname>
              <given-names>E</given-names>
            </name>
            <name>
              <surname>Acar Demirci</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Review of battery state estimation methods for electric vehicles-Part II: SOH estimation</article-title>
          <source>J Energy Storage</source>
          <year>2024</year>
          <volume>96</volume>
          <fpage>112703</fpage>
          <pub-id pub-id-type="doi">10.1016/j.est.2024.112703</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B9">
        <label>9</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Tian</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>D</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A novel dual gated recurrent unit neural network based on error compensation integrated with Kalman filter for the state of charge estimation of parallel battery modules</article-title>
          <source>J Power Sources</source>
          <year>2025</year>
          <volume>635</volume>
          <fpage>236508</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jpowsour.2025.236508</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B10">
        <label>10</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Yin</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Improved particle filter algorithm for remaining useful life prediction of lithium-ion batteries</article-title>
          <source>Power Syst Prot Control</source>
          <year>2024</year>
          <volume>52</volume>
          <fpage>124</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.19783/j.cnki.pspc.231034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B11">
        <label>11</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Qiang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Ding</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A prediction framework for state of health of lithium-ion batteries based on improved support vector regression</article-title>
          <source>J Electrochem Soc</source>
          <year>2023</year>
          <volume>170</volume>
          <fpage>110517</fpage>
          <pub-id pub-id-type="doi">10.1149/1945-7111/ad050e</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B12">
        <label>12</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Qaadan</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Alshare</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Popp</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Schmuelling</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Prediction of lithium-ion battery health using GRU-BPP</article-title>
          <source>Batteries</source>
          <year>2024</year>
          <volume>10</volume>
          <fpage>399</fpage>
          <pub-id pub-id-type="doi">10.3390/batteries10110399</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B13">
        <label>13</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhao</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Liang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Remaining useful life prediction for lithium-ion batteries based on hybrid ensembles allied with data-driven approach</article-title>
          <source>Energies</source>
          <year>2025</year>
          <volume>18</volume>
          <fpage>1114</fpage>
          <pub-id pub-id-type="doi">10.3390/en18051114</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B14">
        <label>14</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Qian</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zou</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Cao</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>SOH and RUL estimation for lithium-ion batteries based on partial charging curve features</article-title>
          <source>Energies</source>
          <year>2025</year>
          <volume>18</volume>
          <fpage>3248</fpage>
          <pub-id pub-id-type="doi">10.3390/en18133248</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B15">
        <label>15</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>XM</given-names>
            </name>
            <name>
              <surname>He</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>LL</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>HB</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>WG</given-names>
            </name>
          </person-group>
          <article-title>RUL prediction for lithium-ion batteries based on DWD-SVR model</article-title>
          <source>Acta Energ Sol Sin</source>
          <year>2025</year>
          <volume>46</volume>
          <fpage>52</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.19912/j.0254-0096.tynxb.2023-1737</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B16">
        <label>16</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cai</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Han</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Multi-step prediction of online lithium battery remaining useful life based on GRNN-GSA-ELM</article-title>
          <source>J Mech Eng</source>
          <year>2024</year>
          <volume>60</volume>
          <fpage>296</fpage>
          <lpage>308</lpage>
          <pub-id pub-id-type="doi">10.3901/JME.2024.24.296</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B17">
        <label>17</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A method for predicting the remaining life of lithium-ion batteries based on an improved Dempster–Shafer evidence theory framework</article-title>
          <source>Energies</source>
          <year>2025</year>
          <volume>18</volume>
          <fpage>3370</fpage>
          <pub-id pub-id-type="doi">10.3390/en18133370</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B18">
        <label>18</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Zhai</surname>
              <given-names>QC</given-names>
            </name>
          </person-group>
          <article-title>A novel remaining useful life prediction method based on fusion feature and OOA-BiGRU for lithium-ion batteries</article-title>
          <source>Trans China Electrotech Soc</source>
          <year>2025</year>
          <volume>40</volume>
          <fpage>2996</fpage>
          <lpage>3012</lpage>
          <pub-id pub-id-type="doi">10.19595/j.cnki.1000-6753.tces.241243</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B19">
        <label>19</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lv</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Ma</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Bao</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Indirect prediction of lithium-ion battery RUL based on CEEMDAN and CNN-BiGRU</article-title>
          <source>Energies</source>
          <year>2024</year>
          <volume>17</volume>
          <fpage>1704</fpage>
          <pub-id pub-id-type="doi">10.3390/en17071704</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B20">
        <label>20</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Niu</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Tian</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Liang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Remaining useful life prediction of PEMFC based on 2-layer bidirectional LSTM network</article-title>
          <source>World Electr Veh J</source>
          <year>2025</year>
          <volume>16</volume>
          <fpage>511</fpage>
          <pub-id pub-id-type="doi">10.3390/wevj16090511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B21">
        <label>21</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Ji</surname>
              <given-names>CL</given-names>
            </name>
            <name>
              <surname>Cao</surname>
              <given-names>LJ</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>XY</given-names>
            </name>
            <name>
              <surname>Duan</surname>
              <given-names>YF</given-names>
            </name>
          </person-group>
          <article-title>Prediction of remaining service life of lithium-ion batteries based on complete ensemble empirical mode decomposition with adaptive noise and BiLSTM-Transformer</article-title>
          <source>Power Syst Prot Control</source>
          <year>2024</year>
          <volume>52</volume>
          <fpage>167</fpage>
          <lpage>77</lpage>
          <pub-id pub-id-type="doi">10.19783/j.cnki.pspc.231507</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B22">
        <label>22</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Mou</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Prediction of the remaining useful life of lithium-ion batteries based on the 1D CNN-BLSTM neural network</article-title>
          <source>Batteries</source>
          <year>2024</year>
          <volume>10</volume>
          <fpage>152</fpage>
          <pub-id pub-id-type="doi">10.3390/batteries10050152</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B23">
        <label>23</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Lithium battery lifespan prediction method integrating dynamic convolution transformer and CMA-ES</article-title>
          <source>Acta Energ Sol Sin</source>
          <year>2025</year>
          <volume>46</volume>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.19912/j.0254-0096.tynxb.2024-2097</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B24">
        <label>24</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sun</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>An</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Battery life evaluation method based on temporal convolution network</article-title>
          <source>Adv Eng Sci</source>
          <year>2025</year>
          <volume>57</volume>
          <fpage>259</fpage>
          <lpage>68</lpage>
          <pub-id pub-id-type="doi">10.12454/j.jsuese.202300930</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B25">
        <label>25</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yin</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Qian</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Transfer learning DAE-LSTM for remaining useful life prediction of Li-ion batteries</article-title>
          <source>Trans China Electrotech Soc</source>
          <year>2024</year>
          <volume>39</volume>
          <fpage>290</fpage>
          <lpage>302</lpage>
          <pub-id pub-id-type="doi">10.19595/j.cnki.1000-6753.tces.221890</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B26">
        <label>26</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Saleem</surname>
              <given-names>U</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Riaz</surname>
              <given-names>S</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>TransRUL: a transformer-based multihead attention model for enhanced prediction of battery remaining useful life</article-title>
          <source>Energies</source>
          <year>2024</year>
          <volume>17</volume>
          <fpage>3976</fpage>
          <pub-id pub-id-type="doi">10.3390/en17163976</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B27">
        <label>27</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Capoglu</surname>
              <given-names>EU</given-names>
            </name>
            <name>
              <surname>Taherkhani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A comparison of different transformer models for time series prediction</article-title>
          <source>Information</source>
          <year>2025</year>
          <volume>16</volume>
          <fpage>878</fpage>
          <pub-id pub-id-type="doi">10.3390/info16100878</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B28">
        <label>28</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhu</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Shi</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>A lithium-ion battery remaining useful life prediction method based on mode decomposition and informer-LSTM</article-title>
          <source>Electronics</source>
          <year>2025</year>
          <volume>14</volume>
          <fpage>3886</fpage>
          <pub-id pub-id-type="doi">10.3390/electronics14193886</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B29">
        <label>29</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Remaining useful life prediction for solid-state lithium batteries based on spatial–temporal relations and neuronal ODE-assisted KAN</article-title>
          <source>Reliab Eng Syst Saf</source>
          <year>2025</year>
          <volume>260</volume>
          <fpage>111003</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ress.2025.111003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B30">
        <label>30</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jiang</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>He</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A robust adapted flexible parallel neural network architecture for early prediction of lithium battery lifespan</article-title>
          <source>Energy</source>
          <year>2024</year>
          <volume>308</volume>
          <fpage>132840</fpage>
          <pub-id pub-id-type="doi">10.1016/j.energy.2024.132840</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B31">
        <label>31</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Life prediction of lithium battery based on particle filter and BP neural network</article-title>
          <source>J Phys Conf Ser</source>
          <year>2024</year>
          <volume>2814</volume>
          <fpage>012047</fpage>
          <pub-id pub-id-type="doi">10.1088/1742-6596/2814/1/012047</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B32">
        <label>32</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>RUL-Mamba: Mamba-based remaining useful life prediction for lithium-ion batteries</article-title>
          <source>J Energy Storage</source>
          <year>2025</year>
          <volume>120</volume>
          <fpage>116376</fpage>
          <pub-id pub-id-type="doi">10.1016/j.est.2025.116376</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B33">
        <label>33</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Min</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Song</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Channel grouping vision transformer for lightweight fruit and vegetable recognition</article-title>
          <source>Expert Syst Appl</source>
          <year>2025</year>
          <volume>292</volume>
          <fpage>128636</fpage>
          <pub-id pub-id-type="doi">10.1016/j.eswa.2025.128636</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B34">
        <label>34</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Early prediction of remaining useful life for lithium-ion batteries with the state space model</article-title>
          <source>Energies</source>
          <year>2024</year>
          <volume>17</volume>
          <fpage>6326</fpage>
          <pub-id pub-id-type="doi">10.3390/en17246326</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B35">
        <label>35</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liao</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Lv</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Review on aging risk assessment and life prediction technology of lithium energy storage batteries</article-title>
          <source>Energies</source>
          <year>2024</year>
          <volume>17</volume>
          <fpage>3668</fpage>
          <pub-id pub-id-type="doi">10.3390/en17153668</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B36">
        <label>36</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Hu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <comment>Squeeze-and-excitation networks. In <italic>2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition</italic>, Salt Lake City, USA. Jun 18-23, 2018. IEEE; 2018. pp. 7132-41.</comment>
          <pub-id pub-id-type="doi">10.1109/CVPR.2018.00745</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>