﻿<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.0 20120330//EN" "http://jats.nlm.nih.gov/publishing/1.0/JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="nlm-ta">Intell. Robot.</journal-id>
      <journal-id journal-id-type="publisher-id">IR</journal-id>
      <journal-title-group>
        <journal-title>Intelligence &amp; Robotics</journal-title>
      </journal-title-group>
      <issn pub-type="epub">2770-3541</issn>
      <publisher>
        <publisher-name>OAE Publishing Inc.</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.20517/ir.2026.19</article-id>
	  <article-id pub-id-type="publisher-id">IR-2026-013001</article-id>
      <article-categories>
        <subj-group>
          <subject>Research Article</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Label co-occurrence guided nonlinear disambiguation for partial multi-label learning</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <name>
            <surname>Song</surname>
            <given-names>Yining</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="aff" rid="I#">
            <sup>#</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Qi</surname>
            <given-names>Fuyu</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="aff" rid="I#">
            <sup>#</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Fan</surname>
            <given-names>Jinfu</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Feng</surname>
            <given-names>Jian</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Li</surname>
            <given-names>Zhiyong</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Bu</surname>
            <given-names>Qingkai</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Lu</surname>
            <given-names>Wenpeng</given-names>
          </name>
          <xref ref-type="aff" rid="I2">
            <sup>2</sup>
          </xref>
          <xref ref-type="aff" rid="I3">
            <sup>3</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <name>
            <surname>Huang</surname>
            <given-names>Linqing</given-names>
          </name>
          <xref ref-type="aff" rid="I4">
            <sup>4</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1" />
        </contrib>
      </contrib-group>
      <aff id="I1">
        <sup>1</sup>School of Computer Science and Technology, Qingdao University, Qingdao 266071, Shandong, China.</aff>
      <aff id="I2">
        <sup>2</sup>Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center, Qilu University of Technology (Shandong Academy of Sciences), Jinan 250000, Shandong, China.</aff>
      <aff id="I3">
        <sup>3</sup>Shandong Provincial Key Laboratory of Computing Power Internet and Service Computing, Shandong Fundamental Research Center for Computer Science, Jinan 250000, Shandong, China.</aff>
      <aff id="I4">
        <sup>4</sup>School of Computer Science, Shanghai Jiao Tong University, Shanghai 200240, China.</aff>
      <aff id="I#">
        <sup>#</sup>These authors contributed equally to this work.</aff>
      <author-notes>
        <corresp id="cor1">Correspondence to: Prof. Linqing Huang, School of Computer Science, Shanghai Jiao Tong University, Shanghai 200240, China. E-mail: <email>huanglinqing@sjtu.edu.cn</email></corresp>
        <fn fn-type="other">
          <p>
            <bold>Received:</bold> 30 Jan 2026 | <bold>First Decision:</bold> 3 Apr 2026 | <bold>Revised:</bold> 23 Apr 2026 | <bold>Accepted:</bold> 24 Jun 2026 | <bold>Published:</bold> 30 Jun 2026</p>
        </fn>
        <fn fn-type="other">
          <p>
            <bold>Academic Editor:</bold> Hao Zhang | <bold>Copy Editor:</bold> Pei-Yun Wang | <bold>Production Editor:</bold> Pei-Yun Wang</p>
        </fn>
      </author-notes>
      <pub-date pub-type="ppub">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>30</day>
        <month>6</month>
        <year>2026</year>
      </pub-date>
      <volume>6</volume>
	  <issue>2</issue>
      <fpage>368</fpage>
	  <lpage>95</lpage>
      <permissions>
        <copyright-statement>© The Author(s) 2026.</copyright-statement>
        <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>© The Author(s) 2026. <bold>Open Access</bold> This article is licensed under a Creative Commons Attribution 4.0 International License (<uri xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</uri>), which permits unrestricted use, sharing, adaptation, distribution and reproduction in any medium or format, for any purpose, even commercially, as long as you give appropriate credit to the original author(s) and the source, provide a link to the Creative Commons license, and indicate if changes were made.</license-p>
        </license>
      </permissions>
      <abstract>
        <p>Partial multi-label learning (PML) addresses challenges where each instance is associated with a set of candidate labels that includes both relevant and irrelevant ones. Traditional label disambiguation strategies often overlook the importance of nonlinear subspace structures. The assumption that data points closely adhere to multiple linear subspaces is restrictive and may not hold in certain applications. Linear subspace clustering algorithms frequently struggle with data that lie on multiple nonlinear manifolds, because they focus only on global linear relationships between data points. To address this gap, we propose a novel approach called label co-occurrence guided nonlinear disambiguation for partial multi-label learning (LCND). Specifically, we introduce a label weight-guided kernel low-rank representation to learn an instance affinity matrix in a nonlinear feature space, enabling effective identification of instances with complex nonlinear structures. Meanwhile, we design a weighted Jaccard distance to quantify label relevance by exploiting label frequency and co-occurrence information. By jointly optimizing instance-level and label-level affinity matrices, the proposed method effectively denoises labels under weak supervision. Extensive experimental results demonstrate that LCND significantly outperforms most state-of-the-art PML methods on the vast majority of benchmark datasets and evaluation metrics.</p>
      </abstract>
      <kwd-group>
        <kwd>Partial multi-label learning</kwd>
        <kwd>weakly supervised learning</kwd>
        <kwd>multi-label learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec id="sec1">
      <title>1. INTRODUCTION</title>
      <p>In the domain of supervised machine learning, multi-label learning (MLL) addresses situations where a single entity can be associated with multiple categories simultaneously<sup>[<xref ref-type="bibr" rid="B1">1</xref>-<xref ref-type="bibr" rid="B3">3</xref>]</sup>. Standard MLL algorithms typically require exhaustive label data for the training dataset<sup>[<xref ref-type="bibr" rid="B1">1</xref>]</sup>, and it is imperative that each training sample be precisely annotated. However, accurately annotating such instances is extremely challenging. Because obtaining completely correct label annotations is time-consuming and labor-intensive<sup>[<xref ref-type="bibr" rid="B4">4</xref>-<xref ref-type="bibr" rid="B6">6</xref>]</sup>, the collected labels are often incomplete, containing both correct and superfluous labels. This scenario has been defined as partial multi-label learning (PML) by<sup>[<xref ref-type="bibr" rid="B7">7</xref>]</sup>.</p>
      <p>To tackle the challenges of PML, employing multi-label classification techniques such as BR<sup>[<xref ref-type="bibr" rid="B8">8</xref>]</sup>, ML-kNN<sup>[<xref ref-type="bibr" rid="B9">9</xref>]</sup>, and CPLST<sup>[<xref ref-type="bibr" rid="B10">10</xref>]</sup> is a viable strategy. However, the presence of noisy labels in the candidate label set can severely distort the training process<sup>[<xref ref-type="bibr" rid="B3">3</xref>,<xref ref-type="bibr" rid="B11">11</xref>]</sup>.</p>
      <p>To address these challenges, various PML techniques have been proposed in recent years<sup>[<xref ref-type="bibr" rid="B12">12</xref>]</sup>. Many PML methods focus on exploiting the intrinsic properties of both the feature and label spaces. In the label decomposition process of PML-LRS<sup>[<xref ref-type="bibr" rid="B13">13</xref>]</sup>, part of the label matrix is assumed to be a low-rank ground-truth label matrix, while the other part is treated as a sparse matrix of irrelevant labels. GLC<sup>[<xref ref-type="bibr" rid="B14">14</xref>]</sup> introduces a label coefficient matrix via low-rank representation (LRR) to capture the global structural information of labels from multiple subspaces. Some methods attempt to reduce the impact of noise in the feature matrix through low-rank and sparse decomposition schemes. Additionally, PML-NI<sup>[<xref ref-type="bibr" rid="B15">15</xref>]</sup> considers the origin of noisy labels, arguing that they typically stem from the ambiguity of instance content. PAMB<sup>[<xref ref-type="bibr" rid="B16">16</xref>]</sup> transforms the PML problem into multiple binary decomposition problems. However, these methods share a critical limitation: when jointly exploiting information from the instance and label spaces<sup>[<xref ref-type="bibr" rid="B17">17</xref>]</sup>, they largely overlook the nonlinear subspace structures inherent in real-world data. Forcing features that reside in nonlinear subspaces to be modeled as linear can lead to inaccurate semantic spaces for instances or labels. Furthermore, the instance space and the label space are inherently strongly connected, yet the joint role of candidate labels and instances remains underexplored.</p>
      <p>A new PML technique, designated as label co-occurrence guided nonlinear disambiguation for partial multi-label learning (LCND), has been introduced to solve the challenges outlined above. Recently, LRR<sup>[<xref ref-type="bibr" rid="B18">18</xref>,<xref ref-type="bibr" rid="B19">19</xref>]</sup> has garnered substantial interest due to its exceptional proficiency in subspace clustering. This approach assumes that high-dimensional data lie close to a union of several low-dimensional linear subspaces. Nonetheless, LRR may fail to produce optimal results with data originating from nonlinear subspaces, as it was initially designed for handling linear subspaces within the input domain<sup>[<xref ref-type="bibr" rid="B20">20</xref>]</sup>. Certain PML techniques that leverage LRR attempt to resolve label ambiguities by decomposing the candidate label matrix into an ideal component and a noise-based component<sup>[<xref ref-type="bibr" rid="B13">13</xref>]</sup>. However, this approach fails to capture the nonlinear interconnections of the data, leading to a loss of local data features and similarity cues during the learning process. Meanwhile, it has been demonstrated that nonlinear subspace learning significantly enhances similarity estimation, as supported by<sup>[<xref ref-type="bibr" rid="B21">21</xref>]</sup>. Numerous researchers have integrated nonlinear subspaces into their studies to demonstrate their effectiveness. Tanfous <italic>et al.</italic> proposed that suitable shape representations and their temporal evolution, termed trajectories, often lie on nonlinear manifolds<sup>[<xref ref-type="bibr" rid="B22">22</xref>]</sup>. Roweis <italic>et al.</italic> introduced locally linear embedding (LLE) by exploiting the local symmetries of linear reconstructions<sup>[<xref ref-type="bibr" rid="B23">23</xref>]</sup>. Using this methodology, LLE can discern the overarching structure of nonlinear manifolds. Conventional linear subspace clustering techniques frequently encounter difficulties when processing data that span multiple nonlinear manifolds. Such challenges are expected, as these methodologies primarily account for global linear correlations among data points. In the context of nonlinear manifolds, the intricate local interactions among data points play a more significant role<sup>[<xref ref-type="bibr" rid="B24">24</xref>]</sup>. Inspired by this research, to overcome the limitations of linear models, we employ a kernel-based mapping technique to project data from the original input space into a feature space using the robust kernel low-rank representation (RKLRR)<sup>[<xref ref-type="bibr" rid="B20">20</xref>]</sup> method. In this transformed feature space, data points are likely to be distributed across various linear subspaces. Subsequently, we can derive an instance affinity matrix, ensuring that instances sharing the same labels lie in the same subspace. In our study, we propose a novel label disambiguation method that incorporates the Jaccard distance to measure similarity between candidate labels, thereby constructing a label affinity matrix. Furthermore, we demonstrate that by integrating this matrix with an instance affinity matrix, our approach effectively harnesses complementary information, thereby enhancing the accuracy and reliability of the label disambiguation.</p>
      <p>To summarize our findings, this research makes several key contributions:<break/>1. We propose a novel method for learning instance affinity matrices by exploring nonlinear subspace data and candidate label information. Using kernel methods for high-dimensional mapping, this approach effectively identifies instances that share the same label, even when the original nonlinear subspace data cause them to lie in multiple linear subspaces.<break/>2. We design a weighted Jaccard distance for label affinity modeling, where label weights are adaptively learned based on label frequency and co-occurrence statistics. This method captures implicit label hierarchies without requiring additional annotations, thereby improving label denoising accuracy.<break/>3. We develop a joint optimization framework for instance-level and label-level affinity matrices, fully leveraging their complementary information to address the insufficient joint utilization of label and instance data in existing PML methods.</p>
    </sec>
    <sec id="sec2">
      <title>2. RELATED WORK</title>
      <sec id="sec2-1">
        <title>2.1. Partial label learning</title>
        <p>In the field of weakly supervised learning, partial label learning (PLL)<sup>[<xref ref-type="bibr" rid="B25">25</xref>-<xref ref-type="bibr" rid="B27">27</xref>]</sup> differs from both supervised and unsupervised learning. Its core objective is to identify a single ground-truth label for each instance from a set of candidate labels<sup>[<xref ref-type="bibr" rid="B28">28</xref>]</sup>. In PLL, each candidate label set contains exactly one ground-truth label and several noisy labels. Existing PLL methods can be categorized into three strategies: label disambiguation, label transformation, and theory-driven methods.</p>
        <p>Label disambiguation techniques primarily include mean-based methods and recognition-based methods<sup>[<xref ref-type="bibr" rid="B29">29</xref>]</sup>. One type of mean-based method<sup>[<xref ref-type="bibr" rid="B30">30</xref>]</sup> proposes a convex optimization approach, where predictions are obtained by averaging the model outputs over all candidate labels. Another method performs vote aggregation on the candidate label sets of neighboring samples of unseen instances<sup>[<xref ref-type="bibr" rid="B31">31</xref>-<xref ref-type="bibr" rid="B33">33</xref>]</sup>. Recognition-based PLL methods<sup>[<xref ref-type="bibr" rid="B34">34</xref>-<xref ref-type="bibr" rid="B36">36</xref>]</sup> treat the ground-truth label as a latent variable and infer the most probable label by constructing a parametric model. In recent years, this approach has been integrated with advanced representation learning techniques such as contrastive learning<sup>[<xref ref-type="bibr" rid="B37">37</xref>]</sup> and graph neural networks<sup>[<xref ref-type="bibr" rid="B38">38</xref>]</sup>.</p>
        <p>The label transformation strategy<sup>[<xref ref-type="bibr" rid="B39">39</xref>,<xref ref-type="bibr" rid="B40">40</xref>]</sup> aims to mitigate the impact of false-positive labels on the candidate set. Theory-driven methods focus on the theoretical foundations of PLL, addressing core issues such as statistical consistency<sup>[<xref ref-type="bibr" rid="B41">41</xref>-<xref ref-type="bibr" rid="B43">43</xref>]</sup>. Additionally, PLL research has been extended to scenarios including class imbalance, multi-view learning, online learning, high-dimensional data, and dimensionality reduction.</p>
        <p>The essence of label disambiguation lies in extracting ground-truth label information by evaluating the credibility of candidate labels. Furthermore, PML significantly increases problem complexity, as the number of ground-truth labels in each candidate label set is unknown, whereas PLL assumes a single ground-truth label.</p>
      </sec>
      <sec id="sec2-2">
        <title>2.2. PML</title>
        <p>PML addresses the scenario in which each training instance is annotated with a candidate label set that contains both ground-truth labels and irrelevant noisy labels<sup>[<xref ref-type="bibr" rid="B7">7</xref>]</sup>. A naive strategy is to treat all candidate labels as correct and apply conventional MLL algorithms such as ML-KNN<sup>[<xref ref-type="bibr" rid="B9">9</xref>]</sup>. However, the presence of noisy labels severely degrades the performance of such approaches. To overcome this limitation, numerous PML methods have been developed, which can be broadly categorized into two paradigms: two-stage disambiguation methods (TDM) and unified framework methods (UFM).</p>
        <sec id="sec2-2-1">
          <title>2.2.1. TDM</title>
          <p>TDM first identify highly reliable labels from the candidate set and subsequently train a robust multi-label classifier using the refined label confidences. Xie and Huang introduced PML-lc and PML-fp, which estimate the probability of each candidate label being ground-truth by exploiting feature-level label correlations and then rank the most relevant labels for each instance<sup>[<xref ref-type="bibr" rid="B7">7</xref>]</sup>. Zhang and Fang proposed PARTICLE, which extracts credible labels through iterative label propagation and then builds a multi-label predictor via pairwise label ranking with virtual label splitting and maximum a posteriori inference<sup>[<xref ref-type="bibr" rid="B44">44</xref>]</sup>. Wang <italic>et al.</italic> developed DRAMA, which constructs a label confidence matrix using feature manifolds and learns a gradient-boosted model to fit these confidences, augmenting the feature space with previous label predictions to capture higher-order label correlations<sup>[<xref ref-type="bibr" rid="B45">45</xref>]</sup>. Liu <italic>et al.</italic> presented PAMB, which leverages error-correcting output codes to decompose the PML problem into multiple binary classification tasks, thereby avoiding direct label confidence estimation and employing a loss-weighted decoding strategy for prediction<sup>[<xref ref-type="bibr" rid="B16">16</xref>]</sup>.</p>
          <p>Despite their effectiveness, two-stage methods suffer from an inherent limitation: errors introduced in the first stage can propagate to the second stage. This issue becomes particularly acute in datasets with high label-noise ratios, where inaccurate confidence estimates may undermine the entire learning process.</p>
        </sec>
        <sec id="sec2-2-2">
          <title>2.2.2. UFM</title>
          <p>In contrast to two-stage approaches, UFM integrate label disambiguation and model training into a single optimization process, iteratively refining the estimates of ground-truth labels during learning. A prominent line of research within this category assumes that the intrinsic relationships between labels and features can be captured in a low-rank subspace, thereby filtering out label noise<sup>[<xref ref-type="bibr" rid="B13">13</xref>,<xref ref-type="bibr" rid="B14">14</xref>,<xref ref-type="bibr" rid="B46">46</xref>]</sup>. Sun <italic>et al.</italic> proposed PML-LRS, which decomposes the candidate label matrix into a low-rank ground-truth component and a sparse noise component, and jointly learns a prediction model<sup>[<xref ref-type="bibr" rid="B13">13</xref>]</sup>. Sun <italic>et al.</italic> further introduced GLC, which integrates global label structures and global-local correlations to enhance disambiguation<sup>[<xref ref-type="bibr" rid="B14">14</xref>]</sup>. Yu <italic>et al.</italic> proposed fPML, which assumes that labels and features reside in a unified space where noise is naturally eliminated through LRR<sup>[<xref ref-type="bibr" rid="B46">46</xref>]</sup>. Xie and Huang developed PML-NI, a unified framework that simultaneously recovers ground-truth labels and identifies noisy ones by exploiting label correlations via trace norm and <italic>ℓ</italic><sub>1</sub> norm regularizers, while also modeling noise directly from feature information<sup>[<xref ref-type="bibr" rid="B15">15</xref>]</sup>. Gong <italic>et al.</italic> proposed MILI-PML, which identifies genuine labels through mutual information maximization<sup>[<xref ref-type="bibr" rid="B47">47</xref>]</sup>.</p>
          <p>Additional studies have explored complementary directions within unified frameworks. Wu <italic>et al.</italic> proposed FIMAN, which enhances feature representation and label precision by leveraging the geometry of multi-view datasets<sup>[<xref ref-type="bibr" rid="B48">48</xref>]</sup>. Hao <italic>et al.</italic> formulated PML-FSOS as a feature selection problem in the presence of noise, jointly examining the label and feature spaces<sup>[<xref ref-type="bibr" rid="B49">49</xref>]</sup>. Hang and Zhang introduced PARD, which pioneers the use of probabilistic graphical models for PML disambiguation<sup>[<xref ref-type="bibr" rid="B50">50</xref>]</sup>. Wang <italic>et al.</italic> proposed PML-ED, which uses KNN-based label attention for probabilistic distribution estimation and conditional layer normalization to capture higher-order label correlations. Recently, deep learning-based PML methods have also emerged<sup>[<xref ref-type="bibr" rid="B51">51</xref>]</sup>. Li <italic>et al.</italic> proposed PML-KGT, which incorporates a K-means graph transformer, cluster centers, and a class-aware correction loss to mitigate the effects of noisy labels<sup>[<xref ref-type="bibr" rid="B52">52</xref>]</sup>.</p>
          <p>However, despite substantial progress, most existing PML methods still assume that data lie in linear subspaces, whereas real-world data often exhibit complex nonlinear structures. Moreover, the joint exploitation of label correlations and instance-level relationships remains insufficiently explored. These limitations motivate the development of our proposed LCND framework, which integrates kernel-based nonlinear feature mapping with weighted label affinity constraints to achieve robust label disambiguation.</p>
        </sec>
      </sec>
    </sec>
    <sec id="sec3">
      <title>3. THE PROPOSED APPROACH</title>
      <p>In this section, we detail the formulation and implementation of LCND, which extends prior work<sup>[<xref ref-type="bibr" rid="B53">53</xref>]</sup> to address the nonlinear PML problem while accounting for label frequency information.</p>
      <p>We represent the feature matrix as <bold>X</bold> = [<bold>x</bold><sub>1</sub>, <bold>x</bold><sub>2</sub>, …, <bold>x</bold><italic><sub>n</sub></italic>] ∈ ℝ<italic><sup>d</sup></italic><sup>×</sup><italic><sup>n</sup></italic>, where <italic>d</italic> denotes the dimensionality of the feature vectors and <italic>n</italic> is the total number of instances. The matrix <bold>Y</bold> = [<bold>y</bold><sub>1</sub>, <bold>y</bold><sub>2</sub>, …, <bold>y</bold><italic><sub>n</sub></italic>] ∈ ℝ<italic><sup>m</sup></italic><sup>×</sup><italic><sup>n</sup></italic> captures the label assignments for the labeled samples, where <italic>m</italic> is the total number of distinct labels. An entry <italic>y<sub>ji</sub></italic> = 1 indicates that the instance <bold>x</bold><italic><sub>i</sub></italic> is annotated with the <italic>j</italic>-th label, while <italic>y<sub>ji</sub></italic> = 0 indicates the absence of that label.</p>
      <p>To predict labels for unseen instances, we learn a projection matrix <bold>W</bold> = [<bold>w</bold><sub>1</sub>, <bold>w</bold><sub>2</sub>, …, <bold>w</bold><italic><sub>d</sub></italic>] ∈ ℝ<italic><sup>m</sup></italic><sup>×</sup><italic><sup>d</sup></italic> that maps feature representations to the label space. Consequently, we optimize <bold>W</bold> by minimizing the quadratic loss as follows:</p>
      <p><disp-formula> <label>(1)</label> <tex-math id="E1"> $$  \min_{\mathbf{W}} \frac{1}{2} \|\mathbf{Y} - \mathbf{W}\mathbf{X}\|_F^2 + \beta \|\mathbf{W}\|_F^2 $$ </tex-math></disp-formula></p>
      <p>In this context, we add a squared Frobenius norm penalty to regularize <bold>W</bold>, which helps prevent overfitting, where <italic>β</italic> is a balancing parameter.</p>
      <sec id="sec3-1">
        <title>3.1. Learn nonlinear relationships</title>
        <p>LRR<sup>[<xref ref-type="bibr" rid="B54">54</xref>,<xref ref-type="bibr" rid="B55">55</xref>]</sup> addresses the subspace clustering problem by identifying the inherent subspace structures of the dataset <bold>X</bold>. The objective of LRR is to find a minimal-rank approximation of <bold>X</bold> using a suitable dictionary<sup>[<xref ref-type="bibr" rid="B18">18</xref>]</sup>, which can be formulated as follows:</p>
        <p><disp-formula> <label>(2)</label> <tex-math id="E1"> $$  \min_{\mathbf{Z}, \mathbf{E}} \|\mathbf{Z}\|_{*} + \lambda \|\mathbf{E}\|_{2,1} \\
		\text{s.t. } \mathbf{X} = \mathbf{X}\mathbf{Z} + \mathbf{E} $$ </tex-math></disp-formula></p>
        <p>Here, <italic>λ</italic> &gt; 0 is a regularization parameter, <bold>E</bold> ∈ ℝ<italic><sup>d</sup></italic><sup>×</sup><italic><sup>n</sup></italic> represents the reconstruction error, ||<bold>Z</bold>||<sub>*</sub> denotes the nuclear norm, and ||<bold>E</bold>||<sub>2,1</sub> = Σ<italic><sub>j</sub></italic><sub>=1</sub><italic><sup>n</sup></italic>(Σ<italic><sub>i</sub></italic><sub>=1</sub><italic><sup>d</sup></italic>(<italic>E<sub>ij</sub></italic>)<sup>2</sup>)<sup>1/2</sup>. The matrix <bold>Z</bold>, obtained by solving Equation (2), approximates a block-diagonal form, where instances with high similarity are grouped into the same subspace, and the magnitudes of the representation coefficients for similar instances are relatively large.</p>
        <p>The equality constraint in Equation (2) can be rewritten as <bold>E</bold> = <bold>X</bold> - <bold>XZ</bold>. Consequently, the LRR optimization problem defined in Equation (2) is equivalent to the following formulation:</p>
        <p><disp-formula> <label>(3)</label> <tex-math id="E1"> $$  \min_{\mathbf{Z}} \|\mathbf{Z}\|_*+\lambda\|\mathbf{X}-\mathbf{X}\mathbf{Z}\|_{2,1} $$ </tex-math></disp-formula></p>
        <p>Introducing an auxiliary matrix <bold>P</bold> = <bold>I</bold> - <bold>Z</bold> ∈ ℝ<italic><sup>n</sup></italic><sup>×</sup><italic><sup>n</sup></italic> allows us to express ||<bold>X</bold> - <bold>XZ</bold>||<sub>2,1</sub> from Equation (2) as ||<bold>X</bold> - <bold>XZ</bold>||<sub>2,1</sub> = ||<bold>X</bold>(<bold>I</bold> - <bold>Z</bold>)||<sub>2,1</sub> = ||<bold>XP</bold>||<sub>2,1</sub> = Σ<italic><sub>i</sub></italic><sub>=1</sub><italic><sup>n</sup></italic>||<bold>Xp<sub>i</sub></bold>|| = Σ<italic><sub>i</sub></italic><sub>=1</sub><italic><sup>n</sup></italic>(<bold>p<sub>i</sub></bold><italic><sup>T</sup></italic><bold>X</bold><italic><sup>T</sup></italic><bold>p<sub>i</sub></bold>)<sup>1/2</sup>, with <bold>P</bold> = [<bold>p</bold><sub>1</sub>, …, <bold>p</bold><italic><sub>n</sub></italic>], where <bold>p<sub>i</sub></bold> ∈ ℝ<italic><sup>n</sup></italic> is the <italic>i</italic>-th column vector of <bold>P</bold> for <italic>i</italic> = 1, …, <italic>n</italic>. Therefore, the formulation in Equation (3) can be reformulated as:</p>
        <p><disp-formula> <label>(4)</label> <tex-math id="E1"> $$ \begin{aligned}&amp;\min_{\mathbf{Z},\mathbf{P}} \|\mathbf{Z}\|_*+\lambda\sum_{i=1}^n\sqrt{\mathbf{p_i}^{T}\mathbf{X}^{T}\mathbf{X}\mathbf{p_i}}\\&amp;\mathrm{~s.t.~} \mathbf{P}=\mathbf{I}-\mathbf{Z}.\end{aligned} $$ </tex-math></disp-formula></p>
        <p>After this reformulation, once the LRR formulation in Equation (2) is transformed into Equation (4), the dataset {<bold>x<sub>i</sub></bold>}<italic><sub>i</sub></italic><sub>=1</sub><italic><sup>n</sup></italic> is represented solely through inner products (i.e., <bold>x<sub>i</sub></bold><italic><sup>T</sup></italic><bold>x<sub>j</sub></bold>) within the expression <bold>X</bold><italic><sup>T</sup></italic><bold>X</bold>. This property naturally allows the incorporation of kernel methods. Specifically, the subsequent nonlinear adaptation of LRR is obtained by substituting <bold>X</bold> in Equation (2) with Ψ(<bold>X</bold>):</p>
        <p><disp-formula> <label>(5)</label> <tex-math id="E1"> $$  \min_\mathbf{Z}\|\mathbf{Z}\|_*+\lambda\|\Psi(\mathbf{X})-\Psi(\mathbf{X})\mathbf{Z}\|_{2,1} $$ </tex-math></disp-formula></p>
        <p>Within this framework, Ψ(<bold>X</bold>) = [Ψ(<bold>x<sub>1</sub></bold>), …, Ψ(<bold>x<sub>n</sub></bold>)] denotes the feature mapping, with Ψ being the transformation Ψ: ℝ<italic><sup>d</sup></italic> → <inline-formula><tex-math id="M1">$$ \mathcal{F}  $$</tex-math></inline-formula>. The resulting space <inline-formula><tex-math id="M1">$$ \mathcal{F}  $$</tex-math></inline-formula> is called the feature space. We define the kernel matrix <bold>K</bold> ∈ ℝ<italic><sup>n</sup></italic><sup>×</sup><italic><sup>n</sup></italic> as <bold>K</bold> = Ψ(<bold>X</bold>)<italic><sup>T</sup></italic>Ψ(<bold>X</bold>). In addition, we define a function <italic>g</italic>(<bold>P</bold>) for <bold>P</bold> ∈ ℝ<italic><sup>n</sup></italic><sup>×</sup><italic><sup>n</sup></italic> as:</p>
        <p><disp-formula> <label>(6)</label> <tex-math id="E1"> $$  g(\mathbf{P})\triangleq\sum_{i=1}^n\sqrt{\mathbf{p_i}^{T}\mathbf{K}\mathbf{p_i}} $$ </tex-math></disp-formula></p>
        <p>where <bold>p<sub>i</sub></bold> ∈ ℝ<italic><sup>n</sup></italic> is the <italic>i</italic>-th column vector of <bold>P</bold> for <italic>i</italic> = 1, …, <italic>n</italic>. Then Equation (5) can be reformulated as:</p>
        <p><disp-formula> <label>(7)</label> <tex-math id="E1"> $$  \begin{aligned}&amp; \min_{\mathbf{Z},\mathbf{P}}\|\mathbf{Z}\|_*+\lambda g(\mathbf{P})\\&amp; \mathrm{~s.t.~}\mathbf{P}=\mathbf{I}-\mathbf{Z}\end{aligned} $$ </tex-math></disp-formula></p>
        <p>The kernel matrix <bold>K</bold>, incorporated into <italic>g</italic>(<bold>P</bold>), plays a crucial role. It is worth noting that using a linear kernel, i.e., <bold>K</bold> = <bold>X</bold><italic><sup>T</sup></italic><bold>X</bold>, reduces the formulation in Equation (7) to that of Equation (2), making LRR a special case of linear kernel methods. Kernel techniques facilitate the detection of complex nonlinear patterns and interactions in the dataset. This is achieved by projecting the data from the original space into a Reproducing Kernel Hilbert Space (RKHS), thereby improving the representation for the target task. With the kernel, nonlinear data structures can be effectively mapped to linearly separable subspaces in the feature space. Consequently, this allows for a comprehensive assessment of similarity between instances. Dissimilar instances, in contrast, are assigned to different subspaces with minimal cross-representation values. As a result, the learned LRR captures instance similarity, where a larger <italic>z<sub>ij</sub></italic> indicates a stronger affinity between x<italic><sub>i</sub></italic> and x<italic><sub>j</sub></italic>.</p>
      </sec>
      <sec id="sec3-2">
        <title>3.2. Learning label affinity matrix</title>
        <p>In PML, exploiting inter-instance relationships can facilitate more accurate label disambiguation. For example, if similarity assessment is based solely on feature distance, instances x<italic><sub>i</sub></italic> and x<italic><sub>j</sub></italic> might appear similar<sup>[<xref ref-type="bibr" rid="B56">56</xref>,<xref ref-type="bibr" rid="B57">57</xref>]</sup>, yet they could belong to different classes due to the empty intersection of their label sets, i.e., <italic>S<sub>i</sub></italic> ∩ <italic>S<sub>j</sub></italic> = Ø. Therefore, incorporating candidate label information helps mitigate the influence of feature-based nearest neighbors with inconsistent labels. Additionally, when instances have overlapping labels but dissimilar features, excluding these shared labels can aid the disambiguation process.</p>
        <p>However, the standard Jaccard similarity treats all labels equally and ignores the implicit label hierarchy commonly observed in real-world datasets. To address this limitation, we propose a weighted Jaccard distance that incorporates label weights derived from the label data itself, without requiring additional prior knowledge.</p>
        <p>Given the label matrix <bold>Y</bold>, we calculate the weight <italic>ω<sub>j</sub></italic> of each label <italic>j</italic> (<italic>j</italic> = 1, 2, …, <italic>m</italic>) based on two statistical properties of the matrix. First, we consider the label frequency <italic>f<sub>j</sub></italic>, which is the number of instances annotated with label <italic>j</italic> and corresponds to the sum of the <italic>j</italic>-th row of <bold>Y</bold>, i.e., <italic>f<sub>j</sub></italic> = Σ<italic><sub>i</sub></italic><sub>=1</sub><italic><sup>n</sup></italic><italic>Y<sub>j</sub></italic><sub>,</sub><italic><sub>i</sub></italic>. We define the frequency score as:</p>
        <p><disp-formula> <label>(8)</label> <tex-math id="E1"> $$  f_{sc,j} = \frac{f_j}{\max_{1 \leq k \leq m} f_k} $$ </tex-math></disp-formula></p>
        <p>Next, we introduce the label co-occurrence rate, which represents the proportion of other labels that co-occur with label <italic>j</italic> (i.e., labels that are simultaneously 1 with <italic>j</italic> in at least one instance). To compute this rate, we first construct the co-occurrence matrix <bold>Co</bold> ∈ ℝ<italic><sup>m</sup></italic><sup>×</sup><italic><sup>m</sup></italic>, where <italic>Co<sub>j</sub></italic><sub>,</sub><italic><sub>k</sub></italic> = Σ<italic><sub>i</sub></italic><sub>=1</sub><italic><sup>n</sup></italic><italic>Y<sub>j</sub></italic><sub>,</sub><italic><sub>i</sub></italic> × <italic>Y<sub>k</sub></italic><sub>,</sub><italic><sub>i</sub></italic> denotes the number of instances in which labels <italic>j</italic> and <italic>k</italic> co-occur. We denote the co-occurrence rate as <italic>c<sub>sc</sub></italic><sub>,</sub><italic><sub>j</sub></italic>, and it is calculated as:</p>
        <p><disp-formula> <label>(9)</label> <tex-math id="E1"> $$  c_{sc,j} = \frac{\text{the count of labels } k \text{ satisfying } Co_{j,k} > 0}{m-1} $$ </tex-math></disp-formula></p>
        <p>The final label weight is obtained by combining the frequency score and the co-occurrence rate using a balancing parameter <italic>η</italic>. We first compute the initial weight as initial_<italic>ω<sub>j</sub></italic> = <italic>η</italic>·<italic>f<sub>sc</sub></italic><sub>,</sub><italic><sub>j</sub></italic> + (1 - <italic>η</italic>)·<italic>c<sub>sc</sub></italic><sub>,</sub><italic><sub>j</sub></italic>, and then normalize these initial weights so that they sum to one, resulting in <inline-formula><tex-math id="M1">$$ \omega _j=\frac{\mathrm{initial}\_\omega _j}{\sum_{k=1}^m\mathrm{initial}\_\omega _k} $$</tex-math></inline-formula>. Here, labels with higher frequency and co-occurrence rate (i.e., more general labels) receive larger <italic>ω<sub>j</sub></italic> values, while specific or rare labels receive smaller <italic>ω<sub>j</sub></italic> values, which aligns with the implicit hierarchical structure of labels.</p>
        <p>Using the label weights <italic>ω<sub>j</sub></italic>, we define the weighted Jaccard distance between label sets <italic>S<sub>i</sub></italic> and <italic>S<sub>j</sub></italic> (where <italic>S<sub>i</sub></italic> denotes the set of labels associated with instance <italic>i</italic>) as:</p>
        <p><disp-formula> <label>(10)</label> <tex-math id="E1"> $$  J_{\omega}(S_i,S_j) = \frac{\sum_{l \in S_i \cup S_j} \omega_l - \sum_{l \in S_i \cap S_j} \omega_l}{\sum_{l \in S_i \cup S_j} \omega_l} \in [0,1]  $$ </tex-math></disp-formula></p>
        <p>Compared with the standard Jaccard distance, the weighted variant emphasizes informative labels while suppressing the influence of rare or noisy labels.</p>
        <p>Finally, the label affinity matrix <bold>H</bold> = [<italic>h<sub>ij</sub></italic>]<italic><sub>n</sub></italic><sub>×</sub><italic><sub>n</sub></italic> is defined as:</p>
        <p><disp-formula> <label>(11)</label> <tex-math id="E1"> $$  h_{ij} = 1 - J_{\omega}(S_i,S_j) $$ </tex-math></disp-formula></p>
        <p>where <italic>h<sub>ij</sub></italic> represents the likelihood that instances <bold>x</bold><italic><sub>i</sub></italic> and <bold>x</bold><italic><sub>j</sub></italic> share ground-truth labels.</p>
        <p>Notably, the label weights <italic>ω<sub>j</sub></italic> and the label weight similarity <italic>sim<sub>ω</sub></italic>(<italic>i</italic>, <italic>j</italic>) defined in this section are further integrated with the Gaussian kernel to construct a label weight-guided fused kernel matrix <bold>K</bold>, which underpins the subsequent nonlinear LRR. The formal definition of <bold>K</bold> is:</p>
        <p><disp-formula> <label>(12)</label> <tex-math id="E1"> $$  \mathbf{K}(i,j) = \theta \cdot e^{-\gamma\|\mathbf{x}_i-\mathbf{x}_j\|^2} + (1-\theta) \cdot sim_{\omega}(i,j) $$ </tex-math></disp-formula></p>
        <p>where <italic>θ</italic> balances the feature and label similarity, and <italic>γ</italic> &gt; 0 is the Gaussian kernel bandwidth. <bold>K</bold> is positive semi-definite, ensuring compatibility with the low-rank optimization framework. Specifically, <italic>sim<sub>ω</sub></italic>(<italic>i</italic>, <italic>j</italic>) quantifies label-based instance relevance and is computed as:</p>
        <p><disp-formula> <label>(13)</label> <tex-math id="E1"> $$  sim_{\omega}(i,j) = \frac{\sum_{l \in S_i \cap S_j} \omega_l}{\sum_{l \in S_i \cup S_j} \omega_l} $$ </tex-math></disp-formula></p>
      </sec>
      <sec id="sec3-3">
        <title>3.3. Predictor</title>
        <p>Specifically, the intrinsic information present in potential label data can enhance the accuracy of subspace clustering. For instance, instances <bold>x<sub>i</sub></bold> and <bold>x<sub>j</sub></bold> may be distinct due to the absence of shared labels, i.e., <italic>S<sub>i</sub></italic> ∩ <italic>S<sub>j</sub></italic> = Ø. Consequently, the corresponding <italic>z<sub>ij</sub></italic> values for these instances are forced to be negligible, either zero or nearly so. Based on this rationale, we incorporate a novel term ||Z○H||<sub>1</sub><sup>2</sup><sup>[<xref ref-type="bibr" rid="B58">58</xref>]</sup>, which integrates the potential label information, where <bold>H</bold> ∈ ℝ<italic><sup>n</sup></italic><sup>×</sup><italic><sup>n</sup></italic> represents the label affinity matrix.</p>
        <p>By combining the above components, LCND is defined as follows:</p>
        <p><disp-formula> <label>(14)</label> <tex-math id="E1"> $$  \begin{aligned}&amp;\min_{\mathbf{W},\mathbf{Z},\mathbf{P}}\|\mathbf{Z}\|_*+\lambda g(\mathbf{P})+\frac12\|\mathbf{Y}-\mathbf{W}\mathbf{X}\mathbf{Z}\|_F^2  + \alpha\left\|\mathbf{Z}\circ\mathbf{H}\right\|_1^2+\beta\|\mathbf{W}\|_F^2\\&amp;\mathrm{~~s.t.~}\mathbf{P}=\mathbf{I}-\mathbf{Z}
		\end{aligned} $$ </tex-math></disp-formula></p>
        <p>where <italic>α</italic> is a regularization parameter that controls the strength of the weak supervision constraint. Specifically, after obtaining the optimal projection matrix <bold>W</bold> through training, the predicted label vector for an unseen test sample <bold>x</bold><italic><sub>t</sub></italic> is generated as <bold>y</bold><italic><sub>t</sub></italic> = <bold>Wx</bold><italic><sub>t</sub></italic>. The final label set is then determined by applying a threshold or by selecting the labels with the highest confidence scores.</p>
      </sec>
      <sec id="sec3-4">
        <title>3.4. Solving the optimization problem</title>
        <p>Introducing auxiliary variables <bold>J</bold>, <bold>U</bold>, and <bold>V</bold> allows us to restructure the objective function in Equation (14) as follows:</p>
        <p><disp-formula> <label>(15)</label> <tex-math id="E1"> $$  \begin{aligned}&amp;\underset{\mathbf{W}, \mathbf{V}, \mathbf{J}, \mathbf{Z}, \mathbf{U}, \mathbf{P}}{\min} \|\mathbf{J}\|_* + \lambda g(\mathbf{P}) + \alpha \left\|\mathbf{U} \circ \mathbf{H}\right\|_1^2  + \frac{1}{2}\|\mathbf{Y} - \mathbf{W}\mathbf{X}\mathbf{V}\|_F^2 + \beta\|\mathbf{W}\|_F^2 \\&amp;\mathrm{~~~~~s.t.~} \quad \mathbf{P} = \mathbf{I} - \mathbf{Z}\end{aligned} $$ </tex-math></disp-formula></p>
        <p>The augmented lagrange multiplier (ALM) method<sup>[<xref ref-type="bibr" rid="B59">59</xref>]</sup> is then employed to handle the following augmented Lagrangian function:</p>
        <p><disp-formula> <label>(16)</label> <tex-math id="E1"> $$  \begin{aligned}  
			&amp;\mathcal{L} = \|\mathbf{J}\|_* + \lambda g(\mathbf{P}) + \alpha \left\|\mathbf{U} \circ \mathbf{H}\right\|_1^2 + \frac{1}{2}\|\mathbf{Y} - \mathbf{W}\mathbf{X}\mathbf{V}\|_F^2  + \beta\|\mathbf{W}\|_F^2   \\
			&amp;+ \operatorname{tr}\left(\mathbf{Y}_{1}^{\mathrm{T}}(\mathbf{I} - \mathbf{Z} - \mathbf{P})\right) + \operatorname{tr}\left(\mathbf{Y}_{2}^{T}(\mathbf{Z} - \mathbf{J})\right) + \operatorname{tr}\left(\mathbf{Y}_{3}^{T}(\mathbf{Z} - \mathbf{U})\right) + \operatorname{tr}\left(\mathbf{Y}_{4}^{T}(\mathbf{Z} - \mathbf{V})\right) \\
			&amp; + \frac{\mu}{2}\left(\|\mathbf{I} - \mathbf{Z} - \mathbf{P}\|_{F}^{2} + \|\mathbf{Z} - \mathbf{J}\|_{F}^{2} + \|\mathbf{Z} - \mathbf{U}\|_{F}^{2} + \|\mathbf{Z} - \mathbf{V}\|_{F}^{2}\right) \\
			&amp;= \|\mathbf{J}\|_* + \lambda g(\mathbf{P}) + \alpha \left\|\mathbf{U} \circ \mathbf{H}\right\|_1^2 + \frac{1}{2}\|\mathbf{Y} - \mathbf{W}\mathbf{X}\mathbf{V}\|_F^2   + \beta\|\mathbf{W}\|_F^2 + \\
			&amp;\frac{\mu}{2}\left(\|\mathbf{I} - \mathbf{Z} - \mathbf{P} + \frac{\mathbf{Y}_{1}}{\mu}\|_{F}^{2} + \|\mathbf{Z} - \mathbf{J} + \frac{\mathbf{Y}_{2}}{\mu}\|_{F}^{2} \right.  \left. + \|\mathbf{Z} - \mathbf{U} + \frac{\mathbf{Y}_{3}}{\mu}\|_{F}^{2} + \|\mathbf{Z} - \mathbf{V} + \frac{\mathbf{Y}_{4}}{\mu}\|_{F}^{2}\right) \\
			&amp;+\frac{1}{2\mu}(\|\mathbf{Y}_{1}\|_{F}^{2}+\|\mathbf{Y}_{2}\|_{F}^{2}+\|\mathbf{Y}_{3}\|_{F}^{2}+\|\mathbf{Y}_{4}\|_{F}^{2}) 
		\end{aligned} $$ </tex-math></disp-formula></p>
        <p>where <bold>Y</bold><sub>1</sub>, <bold>Y</bold><sub>2</sub>, <bold>Y</bold><sub>3</sub>, and <bold>Y</bold><sub>4</sub> are all <italic>N</italic> × <italic>N</italic> matrices in ℝ<italic><sup>N</sup></italic><sup>×</sup><italic><sup>N</sup></italic> and serve as the Lagrange multipliers. Additionally, <italic>μ</italic> &gt; 0 is a penalty parameter.</p>
        <p>The optimization problem in Equation (11) can be solved iteratively by alternating minimization over the following subproblems:</p>
        <p>(1) Optimize <bold>W</bold> while holding other parameters constant: With <bold>V</bold>, <bold>J</bold>, <bold>Z</bold>, <bold>U</bold>, and <bold>P</bold> fixed, the update equation for <bold>W</bold> is obtained by differentiating Equation (17):</p>
        <p><disp-formula> <label>(17)</label> <tex-math id="E1"> $$  \min_{\mathbf{W}}
			\frac12\|\mathbf{Y}-\mathbf{W}\mathbf{X}\mathbf{V}\|_F^2+\beta\|\mathbf{W}\|_F^2  $$ </tex-math></disp-formula></p>
        <p>This corresponds to a standard linear regression problem, whose solution can be determined as follows:</p>
        <p><disp-formula> <label>(18)</label> <tex-math id="E1"> $$  \mathbf{W}=\left(\mathbf{Y}\mathbf{V}^T\mathbf{X}^T\right)\left(\mathbf{X}\mathbf{V}\mathbf{V}^T\mathbf{X}^T+2\beta \mathbf{I}_d\right)^{-1} $$ </tex-math></disp-formula></p>
        <p>(2) Optimize <bold>V</bold> while holding other parameters constant: The task of updating <bold>V</bold> can be treated as a standard linear regression problem, and its solution can be expressed as:</p>
        <p><disp-formula> <label>(19)</label> <tex-math id="E1"> $$  \mathbf{V}=\begin{bmatrix}\left(\mathbf{WX}\right)^\textbf{T}\left(\mathbf{WX}\right)+\mu \mathbf{I}\end{bmatrix}^{-1}\begin{bmatrix}\left(\mathbf{WX}\right)^\textbf{T}\mathbf{Y}+\mu\mathbf{Z} +\mathbf{Y}_4\end{bmatrix} $$ </tex-math></disp-formula></p>
        <p>(3) Optimize <bold>J</bold> while holding other parameters constant: With <bold>W</bold>, <bold>V</bold>, <bold>Z</bold>, <bold>U</bold>, and <bold>P</bold> fixed, the optimization of Equation (16) with respect to <bold>J</bold> reduces to the following problem:</p>
        <p><disp-formula> <label>(20)</label> <tex-math id="E1"> $$  \min_{\mathbf{J}}\left\|\mathbf{J}\right\|_*+\frac {\mu}{2}\left\|\mathbf{Z}-\mathbf{J}+\frac{\mathbf{Y}_2}\mu\right\|_F^2 $$ </tex-math></disp-formula></p>
        <p>The objective in Equation (20) can be equivalently written as:</p>
        <p><disp-formula> <label>(21)</label> <tex-math id="E1"> $$  \min_{\mathbf{J}}\frac12\left\|\mathbf{J}-\left(\mathbf{Z}+\frac{\mathbf{Y}_2}\mu\right)\right\|_F^2+\frac1\mu\left\|\mathbf{J}\right\|_* $$ </tex-math></disp-formula></p>
        <p>Optimizing the objective function in Equation (21) involves performing singular value decomposition (SVD) on the matrix <bold>Z</bold> + <bold>Y</bold><sub>2</sub>/<italic>μ</italic>, followed by applying soft thresholding to the resulting singular values.</p>
        <p>(4) Optimize <bold>Z</bold> while holding other parameters constant: This is an ordinary least squares regression problem. Its solution is:</p>
        <p><disp-formula> <label>(22)</label> <tex-math id="E1"> $$  \mathbf{Z}=(\mathbf{I}-\mathbf{P}+\mathbf{J}+\mathbf{U}+\mathbf{V})/4+(\mathbf{Y}_{1}-\mathbf{Y}_{2}-\mathbf{Y}_{3}-\mathbf{Y}_{4})/(4\mu) $$ </tex-math></disp-formula></p>
        <p>(5) Next, update <bold>U</bold> with the other variables fixed:</p>
        <p><disp-formula> <label>(23)</label> <tex-math id="E1"> $$  \mathbf{U}_{k+1} = \operatorname*{argmin}_{\mathbf{U}} \frac{\alpha}{\mu_k} \left\| \mathbf{U} \circ \mathbf{H} \right\|_1 + \frac{1}{2} \left\| \mathbf{U} - \left( \mathbf{Z}_{k+1} + \frac{\mathbf{Y}_{3,k}}{\mu_k} \right) \right\|_F^2   $$ </tex-math></disp-formula></p>
        <p>Therefore, <bold>U</bold> can be updated using Equation (24):</p>
        <p><disp-formula> <label>(24)</label> <tex-math id="E1"> $$  \mathbf{U}_{k+1}=\Psi_{\frac{\alpha\mathbf{H}}{\mu_k}}\left(\mathbf{Z}_{k+1}+\frac1{\mu_k}\mathbf{Y}_{3,k}\right) $$ </tex-math></disp-formula></p>
        <p>where the function <inline-formula><tex-math id="M1">$$ \Psi _{\frac{\alpha \mathrm{H}}{\mu_k}} $$</tex-math></inline-formula>(<bold>X</bold>) is defined as the element-wise product of max(|<bold>X</bold>| - <inline-formula><tex-math id="M1">$$ \frac{\alpha}{\mu_k} $$</tex-math></inline-formula><bold>H</bold>, <bold>0</bold>) and sgn(<bold>X</bold>), the sign function of <bold>X</bold>. Here, the update of <bold>U</bold> corresponds to a soft-thresholding operation.</p>
        <p>(6) Update <bold>P</bold> with the other variables fixed: The optimization problem for updating <bold>P</bold><italic><sub>k</sub></italic><sub>+1</sub> is formulated as follows:</p>
        <p><disp-formula> <label>(25)</label> <tex-math id="E1"> $$  \min_{\mathbf{P}} \lambda g\left(\mathbf{P}\right)+\frac{\mu_k}{2}\left\|\mathbf{P}-\mathbf{C}_{k+1}\right\|_F^2 $$ </tex-math></disp-formula></p>
        <p>where <bold>C</bold><italic><sub>k</sub></italic><sub>+1</sub> = <bold>I</bold> - <bold>Z</bold><italic><sub>k</sub></italic><sub>+1</sub> + <bold>Y</bold><sub>1,</sub><italic><sub>k</sub></italic>/<italic>μ<sub>k</sub></italic>. Note that solving the problem in Equation (25) is nontrivial, as the objective function is convex but nonsmooth. Let <bold>c</bold><italic><sub>i</sub></italic> (respectively, <bold>p</bold><italic><sub>i</sub></italic>) denote the <italic>i</italic>-th column vector of <bold>C</bold> (respectively, <bold>P</bold>), and set the scalar <italic>τ</italic> = <italic>μ<sub>k</sub></italic>/<italic>λ</italic>. Then (<italic>μ<sub>k</sub></italic>/2)||<bold>P</bold> - <bold>C</bold>||<italic><sub>F</sub></italic><sup>2</sup> can be rewritten as <italic>μ<sub>k</sub></italic>((<italic>τ</italic>/2)Σ<italic><sub>i</sub></italic><sub>=1</sub><italic><sup>n</sup></italic><italic>|</italic>|<bold>p</bold><italic><sub>i</sub> </italic>- <bold>c</bold><italic><sub>i</sub></italic>||<sup>2</sup>). Normalizing the objective function by <italic>λ</italic>, the problem stated in Equation (25) can be reformulated as:</p>
        <p><disp-formula> <label>(26)</label> <tex-math id="E1"> $$  \min_{\{\mathbf{p}_i\}_{i=1}^n}\sum_{i=1}^n\sqrt{\mathbf{p}_i^{T}\mathbf{K}\mathbf{p}_i}+\frac\tau2\sum_{i=1}^n\|\mathbf{p}_i-\mathbf{c}_i\|^2 $$ </tex-math></disp-formula></p>
        <p>The problem can be decomposed into <italic>n</italic> independent subproblems, each taking the following form:</p>
        <p><disp-formula> <label>(27)</label> <tex-math id="E1"> $$  \min_{\mathbf{p}_i}\sqrt{\mathbf{p}_i^{T}\mathbf{K}\mathbf{p}_i}+\frac\tau2\|\mathbf{p}_i-\mathbf{c}_i\|^2 $$ </tex-math></disp-formula></p>
        <p>
          <italic>Lemma 1</italic>: Let <italic>τ</italic> &gt; 0 be a scalar, <bold>b</bold> ∈ ℝ<italic><sup>q</sup></italic> a constant vector (<italic>q</italic> is a positive integer), and <bold>S</bold> = diag({<italic>s<sub>i</sub></italic>}<sub>1≤</sub><italic><sub>i</sub></italic><sub>≤</sub><italic><sub>q</sub></italic>) ∈ ℝ<italic><sup>q</sup></italic><sup>×</sup><italic><sup>q</sup></italic> a diagonal matrix whose diagonal entries <italic>s<sub>i</sub></italic> are positive and sorted in descending order. Then the optimal solution <bold>p</bold><sup>*</sup> to the following problem:</p>
        <p><disp-formula> <label>(28)</label> <tex-math id="E1"> $$  \min_{\mathbf{p}\in\mathbb{R}^q}\sqrt{\mathbf{p}^{T}\mathbf{S}^2\mathbf{p}}+\frac\tau2\|\mathbf{p}-\mathbf{b}\|^2 $$ </tex-math></disp-formula></p>
        <p>is given by</p>
        <p><disp-formula> <label>(29)</label> <tex-math id="E1"> $$  \mathbf{p}^*=\begin{cases}\left(\frac{\mathbf{S}^2}{\tau\delta}+\mathbf{I}\right)^{-1}\mathbf{b},&amp;\text{if } \|\mathbf{S}^{-1}\mathbf{b}\| > \frac{1}{\tau},\\\mathbf{0}_q,&amp;\text{otherwise.}\end{cases} $$ </tex-math></disp-formula></p>
        <p>Here, <bold>S</bold><sup>-1</sup> = diag({<italic>s<sub>i</sub></italic><sup>-1</sup>}<sub>1≤</sub><italic><sub>i</sub></italic><sub>≤</sub><italic><sub>q</sub></italic>) is the inverse of <bold>S</bold>, and the positive scalar <italic>δ</italic> satisfies:</p>
        <p><disp-formula> <label>(30)</label> <tex-math id="E1"> $$  \mathbf{b}^{T}\mathrm{diag}\left(\left\{\frac{s_i^2}{(\tau\delta+s_i^2)^2}\right\}_{1\leq i\leq q}\right)\mathbf{b}=\frac1{\tau^2}. $$ </tex-math></disp-formula></p>
        <p>In particular, when ||<bold>S</bold><sup>-1</sup><bold>b</bold>|| &gt; 1/<italic>τ</italic>, Equation (30) (with respect to <italic>δ</italic>) has a unique positive solution, which can be found via the bisection method as described in<sup>[<xref ref-type="bibr" rid="B20">20</xref>]</sup>. The proof of Lemma 1 is provided in the <inline-supplementary-material content-type="local-data" mimetype="application/pdf" xlink:href="ir6019-SupplementaryMaterials.pdf">Supplementary Materials</inline-supplementary-material>. Leveraging Lemma 1, we obtain the following theorem.</p>
        <p>
          <italic>Theorem 1</italic>: For <italic>τ</italic> &gt; 0, the optimal solution <bold>p</bold><italic><sub>i</sub></italic><sup>*</sup> to the problem in Equation (27) can be expressed as:</p>
        <p><disp-formula> <label>(31)</label> <tex-math id="E1"> $$ \mathbf{p}_i^* =  
		\begin{cases}  
			\hat{\mathbf{p}}, &amp; \text{if } \left\lVert \left[\frac{1}{\sigma_1},\ldots,\frac{1}{\sigma_{r_K}}\right]^T \circ \tilde{\mathbf{b}}_u \right\rVert > \frac{1}{\tau}, \\  
			\mathbf{c}_i - \mathbf{G}_K \tilde{\mathbf{b}}_u, &amp; \text{otherwise,}  
		\end{cases}    $$ </tex-math></disp-formula></p>
        <p>where <inline-formula><tex-math id="M1">$$ \mathbf{\tilde{b}} $$</tex-math></inline-formula><italic><sub>u</sub></italic> = <bold>G</bold><italic><sub>K</sub></italic><italic><sup>T</sup></italic><bold>c</bold><italic><sub>i</sub></italic> ∈ <inline-formula><tex-math id="M1">$$ \mathbb{R}^{r_K}  $$</tex-math></inline-formula>, and <bold>G</bold><italic><sub>K</sub></italic> ∈ <inline-formula><tex-math id="M1">$$ \mathbb{R}^{n\times r_K}  $$</tex-math></inline-formula> consists of the first <italic>r<sub>K</sub></italic> columns of <bold>G</bold>. The vector <inline-formula><tex-math id="M1">$$ \hat{\mathbf{p}} $$</tex-math></inline-formula> is defined as</p>
        <p><disp-formula> <label>(32)</label> <tex-math id="E1"> $$  \hat{\mathbf{p}} = \mathbf{c}_i - \mathbf{G}_K \Bigg( \left[\frac{\sigma_1^2}{\tau\delta+\sigma_1^2},\ldots,\frac{\sigma_{r_K}^2}{\tau\delta+\sigma_{r_K}^2}\right]^T \circ \tilde{\mathbf{b}}_u \Bigg). $$ </tex-math></disp-formula></p>
        <p>Here, <italic>δ</italic> is a positive scalar satisfying:</p>
        <p><disp-formula> <label>(33)</label> <tex-math id="E1"> $$  \tilde{\mathbf{b}}_u^{T} \mathrm{diag}\left(\left\{\frac{\sigma_i^2}{(\tau\delta+\sigma_i^2)^2}\right\}_{1\leq i\leq r_K}\right) \tilde{\mathbf{b}}_u = \frac{1}{\tau^2}. $$ </tex-math></disp-formula></p>
        <p>Specifically, if the norm ||[1/<italic>σ</italic><sub>1</sub>, …, 1/<inline-formula><tex-math id="M1">$$ \sigma _{r_K} $$</tex-math></inline-formula>]<italic><sup>T</sup></italic>○<inline-formula><tex-math id="M1">$$ \tilde{\mathbf{b}} $$</tex-math></inline-formula><italic><sub>u</sub></italic>|| exceeds 1/<italic>τ</italic>, then Equation (33) (with respect to <italic>δ</italic>) has a unique positive solution, which can be obtained using the bisection method as previously described<sup>[<xref ref-type="bibr" rid="B20">20</xref>]</sup>. The verification of Lemma 1 is detailed in the <inline-supplementary-material content-type="local-data" mimetype="application/pdf" xlink:href="ir6019-SupplementaryMaterials.pdf">Supplementary Materials</inline-supplementary-material>.</p>
        <p>For a detailed update procedure, please refer to <xref ref-type="fig" rid="alg1">Algorithm 1</xref>. The detailed update process for parameter <bold>P</bold> is presented in <xref ref-type="fig" rid="alg2">Algorithm 2</xref>.</p>
		<fig id="alg1" position="float">
          <label>Algorithm 1</label>
          <caption />
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6019.alg.1.jpg" />
        </fig>
		<fig id="alg2" position="float">
          <label>Algorithm 2</label>
          <caption />
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6019.alg.2.jpg" />
        </fig>
      </sec>
    </sec>
    <sec id="sec4">
      <title>4. EXPERIMENTS</title>
      <p>In this study, we conduct experiments on three real-world datasets and six synthetic datasets to demonstrate the effectiveness of the proposed LCND algorithm. This section begins with an overview of the datasets, evaluation metrics, and compared algorithms. We then present four sets of experiments designed to verify the efficacy of LCND. First, we provide a comprehensive analysis of the results from eight different methods across 21 datasets. Second, we perform ablation studies to assess the contribution of handling nonlinear challenges and leveraging label correlations in our model. Third, we evaluate the model’s sensitivity to parameter variations. Finally, we analyze the computational complexity.</p>
      <sec id="sec4-1">
        <title>4.1. Datasets</title>
        <p>We select three real-world datasets, namely <italic>music_emotion</italic>, <italic>music_style</italic><sup>[<xref ref-type="bibr" rid="B44">44</xref>]</sup>, and <italic>mirflickr</italic><sup>[<xref ref-type="bibr" rid="B60">60</xref>]</sup>. As shown in <xref ref-type="table" rid="t1">Table 1</xref>, these datasets represent real-world PML instances, where candidate labels are obtained from online users and subsequently verified to establish ground-truth labels. In addition, we consider six synthetic datasets derived from multi-label benchmarks: <italic>Bibtex</italic><sup>[<xref ref-type="bibr" rid="B61">61</xref>]</sup>, <italic>Birds</italic><sup>[<xref ref-type="bibr" rid="B62">62</xref>]</sup>, <italic>Emotions</italic><sup>[<xref ref-type="bibr" rid="B63">63</xref>]</sup>, <italic>Image</italic><sup>[<xref ref-type="bibr" rid="B9">9</xref>]</sup>, <italic>Medical</italic><sup>[<xref ref-type="bibr" rid="B64">64</xref>]</sup>, and <italic>Scene</italic><sup>[<xref ref-type="bibr" rid="B8">8</xref>]</sup>. To evaluate the robustness of our approach under different levels of label noise, we introduce a parameter <italic>r</italic> ∈ {1, 2, 3} that controls the number of false positive labels added to the candidate label set of each instance<sup>[<xref ref-type="bibr" rid="B16">16</xref>]</sup>. By applying these three noise settings to each of the six original multi-label datasets, we construct 6 × 3 = 18 synthetic PML datasets with varying noise intensities. In addition to these synthetic datasets, we also use the three real-world datasets for validation. All comparative experiments are therefore conducted across 21 benchmark datasets. The detailed characteristics of these datasets are summarized in <xref ref-type="table" rid="t2">Table 2</xref>.</p>
        <table-wrap id="t1">
          <label>Table 1</label>
          <caption>
            <p>Characteristics of the experimental data sets</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Data</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Examples</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Features</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Labels</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>AVG<sup>*</sup>CL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>AVG<sup>*</sup>GL</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>music_emotion</td>
                <td>6,833</td>
                <td>98</td>
                <td>11</td>
                <td>5.29</td>
                <td>2.42</td>
              </tr>
              <tr>
                <td>music_style</td>
                <td>6,839</td>
                <td>98</td>
                <td>10</td>
                <td>6.04</td>
                <td>1.44</td>
              </tr>
              <tr>
                <td>mirflickr</td>
                <td>10,433</td>
                <td>100</td>
                <td>7</td>
                <td>3.35</td>
                <td>1.77</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>These are the real-world PML data sets. AVG<sup>*</sup>CL: The average number of candidate labels. AVG<sup>*</sup>GL: the average number of ground-truth labels. PML: Partial multi-label learning.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap id="t2">
          <label>Table 2</label>
          <caption>
            <p>Multi-label data sets employed to generate synthetic PML data sets</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Data</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Examples</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Features</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Labels</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>AVG<sup>*</sup>CL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Configurations</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>Bibtex</td>
                <td>7,395</td>
                <td>1,836</td>
                <td>159</td>
                <td>2.40</td>
                <td rowspan="6">
                  <italic>r</italic> ∈ {1,2,3}</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>645</td>
                <td>260</td>
                <td>19</td>
                <td>1.01</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>593</td>
                <td>72</td>
                <td>6</td>
                <td>1.87</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>2,000</td>
                <td>294</td>
                <td>5</td>
                <td>1.24</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>978</td>
                <td>1,449</td>
                <td>45</td>
                <td>1.25</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>2,407</td>
                <td>294</td>
                <td>6</td>
                <td>1.08</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Configurations: the operation of adding false positive labels to a dataset. PML: Partial multi-label learning; AVG<sup>*</sup>CL: the average number of candidate labels.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec id="sec4-2">
        <title>4.2. Experimental setup</title>
        <sec id="sec4-2-1">
          <title>4.2.1. Evaluation metrics</title>
          <p>To evaluate the performance of the eight compared algorithms, we adopt five widely used evaluation metrics: <italic>ranking loss</italic>, <italic>Hamming loss</italic>, <italic>one error</italic>, <italic>coverage</italic>, and <italic>average precision</italic>. For a comprehensive understanding of these metrics, refer to<sup>[<xref ref-type="bibr" rid="B1">1</xref>]</sup>. These metrics provide a multifaceted assessment of partial multi-label classification models. Specifically, performance improves as the values of ranking loss, Hamming loss, one error, and coverage decrease. Conversely, for average precision, a higher value indicates better performance. In addition, we use the microF1 metric<sup>[<xref ref-type="bibr" rid="B16">16</xref>]</sup>. LCND also achieves the best performance in terms of microF1. To evaluate the statistical significance of the performance differences between LCND and the best-performing baseline method, we conduct <italic>t</italic>-tests at the 0.05 significance level. The best results are highlighted in bold in the result tables.</p>
        </sec>
        <sec id="sec4-2-2">
          <title>4.2.2. Comparison with other methods</title>
          <p>To evaluate the effectiveness of the proposed LCND approach, we compare it with seven state-of-the-art PML methods and one MLL method. The methods compared are listed as follows:</p>
          <p>• ML-KNN<sup>[<xref ref-type="bibr" rid="B9">9</xref>]</sup> adapts the <italic>k</italic>-nearest neighbors approach for multi-label classification. It uses statistical information from the labels of the nearest training examples to predict label sets for unseen instances via a maximum a posteriori decision rule [suggested configuration: <italic>k</italic> = 10].</p>
          <p>• PML-lc<sup>[<xref ref-type="bibr" rid="B7">7</xref>]</sup> optimizes the label relevance order for each instance by minimizing a rank loss weighted by confidence values, which estimate the likelihood that a candidate label is a ground-truth label. It refines these confidence values by exploiting structural information in the feature and label spaces [suggested configuration: <italic>C</italic><sub>1</sub> = 1, <italic>C</italic><sub>2</sub> = 1].</p>
          <p>• PARTICLE<sup>[<xref ref-type="bibr" rid="B44">44</xref>]</sup> handles noisy and overcomplete candidate label sets using a two-stage process. It first identifies credible labels through label propagation and then induces a reliable multi-label predictor based on these labels [suggested configuration: <italic>k</italic> = 10, <italic>α</italic> = 0.95, <italic>thr</italic> = 0.9].</p>
          <p>• PAMB<sup>[<xref ref-type="bibr" rid="B16">16</xref>]</sup> learns by transforming the PML problem into multiple binary classification tasks using error-correcting output codes. It avoids direct estimation of label confidence and instead employs a loss-weighted decoding strategy for prediction [suggested configuration: <italic>L</italic> = 100log<sub>2</sub>(<italic>q</italic>)].</p>
          <p>• PML-NI<sup>[<xref ref-type="bibr" rid="B15">15</xref>]</sup> addresses PML by simultaneously recovering ground-truth labels and identifying noisy labels. It uses a unified optimization framework that exploits label correlations and directly models feature noise [suggested configuration: <italic>β</italic> = 0.5, <italic>γ</italic> = 0.5, <italic>λ</italic> = 1].</p>
          <p>• NATAL<sup>[<xref ref-type="bibr" rid="B65">65</xref>]</sup> handles PML by assuming that the given labeling information is precise, and that missing feature information can be completed. It directly learns a prediction model from the enhanced features while considering all candidate labels [suggested configuration: <italic>α</italic> = 1, <italic>β</italic> = 10<sup>-6</sup>, <italic>λ</italic> = 0.1].</p>
          <p>• PLAIN<sup>[<xref ref-type="bibr" rid="B66">66</xref>]</sup> leverages deep learning and graph techniques to disambiguate candidate label sets in PML. It uses instance-level and label-level similarities to improve label prediction accuracy [suggested configuration: <italic>K</italic> = 10, <italic>α</italic> = 0.01, <italic>β</italic> = 0.01, <italic>n</italic> = 0.1, <italic>ρ</italic> = 3].</p>
          <p>• PML-TF<sup>[<xref ref-type="bibr" rid="B67">67</xref>]</sup> is an effective transformer-based framework for PML. It introduces partial K-means cross-attention to learn discriminative label embeddings and capture local features, and designs a class-aware correction loss to mitigate label noise [suggested configuration: <italic>γ</italic> = 2].</p>
        </sec>
      </sec>
      <sec id="sec4-3">
        <title>4.3. Performance comparison</title>
        <p>The experimental work presented herein was conducted on a computing platform equipped with an octa-core processor (each core running at 2.0 GHz) and 16.0 GB of RAM. The software used for these experiments is MATLAB version R2016a.</p>
        <p>The detailed experimental results are presented in <xref ref-type="table" rid="t3">Tables 3</xref>-<xref ref-type="table" rid="t6">6</xref>. In these tables, bold text indicates that the corresponding algorithm achieved the best performance among all compared methods. Compared with the competing methods, LCND achieves superior performance in most experimental settings. PLAIN outperforms LCND in only one case, namely on the <italic>Birds</italic> dataset with respect to <italic>ranking loss</italic>.</p>
        <table-wrap id="t3">
          <label>Table 3</label>
          <caption>
            <p>Compare LCND with PML methods on real data</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Data</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>LCND</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>ML-KNN</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-<italic>lc</italic></bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PARTICLE</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PAMB</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-NI</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>NATAL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PLAIN</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-TF</bold>
                </td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Hamming Loss (the lower the better)</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>music-emotion</td>
                <td>
                  <bold>0.208±0.010</bold>
                </td>
                <td>0.889±0.024</td>
                <td>0.241±0.006</td>
                <td>0.243±0.009</td>
                <td>
                  <bold>0.208±0.021</bold>
                </td>
                <td>0.257±0.025</td>
                <td>0.877±0.027</td>
                <td>0.281±0.018</td>
                <td>0.498±0.027</td>
              </tr>
              <tr>
                <td>music-style</td>
                <td>0.141±0.021</td>
                <td>0.855±0.028</td>
                <td>0.153±0.023</td>
                <td>0.137±0.035</td>
                <td>
                  <bold>0.123±0.031</bold>
                </td>
                <td>0.154±0.028</td>
                <td>0.493±0.035</td>
                <td>0.361±0.011</td>
                <td>0.269±0.014</td>
              </tr>
              <tr>
                <td>mirflickr</td>
                <td>0.210±0.019</td>
                <td>0.761±0.115</td>
                <td>0.209±0.012</td>
                <td>0.228±0.022</td>
                <td>
                  <bold>0.164±0.035</bold>
                </td>
                <td>0.228±0.018</td>
                <td>0.381±0.014</td>
                <td>0.236±0.026</td>
                <td>0.239±0.033</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Ranking Loss (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>music-emotion</td>
                <td>
                  <bold>0.228±0.006</bold>
                </td>
                <td>0.372±0.012</td>
                <td>0.389±0.002</td>
                <td>0.336±0.014</td>
                <td>0.234±0.021</td>
                <td>0.247±0.028</td>
                <td>0.294±0.009</td>
                <td>0.298±0.034</td>
                <td>0.233±0.032</td>
              </tr>
              <tr>
                <td>music-style</td>
                <td>0.134±0.011</td>
                <td>0.235±0.017</td>
                <td>0.699±0.025</td>
                <td>0.351±0.024</td>
                <td>0.152±0.033</td>
                <td>0.133±0.043</td>
                <td>0.302±0.051</td>
                <td>0.260±0.037</td>
                <td>
                  <bold>0.126±0.017</bold>
                </td>
              </tr>
              <tr>
                <td>mirflickr</td>
                <td>
                  <bold>0.107±0.003</bold>
                </td>
                <td>0.197±0.022</td>
                <td>0.199±0.021</td>
                <td>0.188±0.018</td>
                <td>0.136±0.016</td>
                <td>0.134±0.025</td>
                <td>0.251±0.017</td>
                <td>0.196±0.014</td>
                <td>0.115±0.009</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>One Error (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>music-emotion</td>
                <td>
                  <bold>0.386±0.015</bold>
                </td>
                <td>0.600±0.005</td>
                <td>0.623±0.003</td>
                <td>0.587±0.005</td>
                <td>0.403±0.008</td>
                <td>0.453±0.013</td>
                <td>0.527±0.012</td>
                <td>0.453±0.022</td>
                <td>0.388±0.038</td>
              </tr>
              <tr>
                <td>music-style</td>
                <td>0.333±0.021</td>
                <td>0.403±0.021</td>
                <td>0.495±0.002</td>
                <td>0.419±0.031</td>
                <td>0.367±0.017</td>
                <td>0.341±0.019</td>
                <td>0.578±0.024</td>
                <td>0.542±0.028</td>
                <td>
                  <bold>0.291±0.025</bold>
                </td>
              </tr>
              <tr>
                <td>mirflickr</td>
                <td>0.268±0.030</td>
                <td>0.459±0.034</td>
                <td>0.269±0.005</td>
                <td>0.165±0.009</td>
                <td>0.357±0.014</td>
                <td>0.275±0.021</td>
                <td>0.547±0.025</td>
                <td>
                  <bold>0.157±0.031</bold>
                </td>
                <td>0.273±0.038</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Coverage (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>music-emotion</td>
                <td>
                  <bold>0.394±0.009</bold>
                </td>
                <td>0.568±0.015</td>
                <td>0.521±0.023</td>
                <td>0.484±0.009</td>
                <td>0.412±0.023</td>
                <td>0.408±0.025</td>
                <td>0.492±0.043</td>
                <td>0.412±0.019</td>
                <td>0.443±0.029</td>
              </tr>
              <tr>
                <td>music-style</td>
                <td>
                  <bold>0.195±0.013</bold>
                </td>
                <td>0.302±0.007</td>
                <td>0.467±0.011</td>
                <td>0.368±0.005</td>
                <td>0.213±0.012</td>
                <td>0.191±0.023</td>
                <td>0.352±0.013</td>
                <td>0.405±0.017</td>
                <td>0.256±0.021</td>
              </tr>
              <tr>
                <td>mirflickr</td>
                <td>
                  <bold>0.211±0.007</bold>
                </td>
                <td>0.285±0.009</td>
                <td>0.224±0.022</td>
                <td>0.305±0.032</td>
                <td>0.237±0.016</td>
                <td>0.235±0.032</td>
                <td>0.317±0.011</td>
                <td>0.284±0.014</td>
                <td>0.215±0.021</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Average Precision (the higher the better)</bold>
                </td>
              </tr>
              <tr>
                <td>music-emotion</td>
                <td>0.628±0.006</td>
                <td>0.525±0.024</td>
                <td>0.489±0.003</td>
                <td>0.542±0.007</td>
                <td>
                  <bold>0.636±0.013</bold>
                </td>
                <td>0.612±0.012</td>
                <td>0.581±0.021</td>
                <td>0.612±0.034</td>
                <td>0.596±0.009</td>
              </tr>
              <tr>
                <td>music-style</td>
                <td>
                  <bold>0.747±0.008</bold>
                </td>
                <td>0.654±0.123</td>
                <td>0.523±0.052</td>
                <td>0.621±0.073</td>
                <td>0.722±0.023</td>
                <td>0.743±0.059</td>
                <td>0.548±0.046</td>
                <td>0.580±0.037</td>
                <td>0.741±0.018</td>
              </tr>
              <tr>
                <td>mirflickr</td>
                <td>
                  <bold>0.810±0.011</bold>
                </td>
                <td>0.685±0.008</td>
                <td>0.675±0.034</td>
                <td>0.690±0.028</td>
                <td>0.768±0.028</td>
                <td>0.781±0.048</td>
                <td>0.660±0.062</td>
                <td>0.768±0.033</td>
                <td>0.805±0.017</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>microF1 (the higher the better)</bold>
                </td>
              </tr>
              <tr>
                <td>music-emotion</td>
                <td>
                  <bold>0.489±0.022</bold>
                </td>
                <td>0.308±0.011</td>
                <td>0.294±0.006</td>
                <td>0.332±0.011</td>
                <td>0.463±0.009</td>
                <td>0.459±0.012</td>
                <td>0.287±0.029</td>
                <td>0.463±0.013</td>
                <td>0.469±0.012</td>
              </tr>
              <tr>
                <td>music-style</td>
                <td>
                  <bold>0.591±0.013</bold>
                </td>
                <td>0.401±0.017</td>
                <td>0.355±0.010</td>
                <td>0.519±0.018</td>
                <td>0.575±0.017</td>
                <td>0.552±0.029</td>
                <td>0.390±0.024</td>
                <td>0.488±0.026</td>
                <td>0.588±0.023</td>
              </tr>
              <tr>
                <td>mirflickr</td>
                <td>
                  <bold>0.701±0.026</bold>
                </td>
                <td>0.382±0.012</td>
                <td>0.582±0.013</td>
                <td>0.613±0.026</td>
                <td>0.681±0.042</td>
                <td>0.675±0.027</td>
                <td>0.543±0.031</td>
                <td>0.668±0.022</td>
                <td>0.669±0.034</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>The best performance is shown in bold (<italic>t</italic>-test at 0.05 significance). LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning; PML: partial multi-label learning.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
		<table-wrap id="t4">
          <label>Table 4</label>
          <caption>
            <p>Comparison of LCND with state-of-the-art PML methods on six evaluation metrics</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Data</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>LCND</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>ML-KNN</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-<italic>lc</italic></bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PARTICLE</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PAMB</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-NI</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>NATAL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PLAIN</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-TF</bold>
                </td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Hamming Loss (the lower the better)</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>Bibtex</td>
                <td>0.014±0.002</td>
                <td>0.998±0.012</td>
                <td>0.018±0.034</td>
                <td>0.015±0.006</td>
                <td>0.024±0.018</td>
                <td>0.014±0.048</td>
                <td>0.982±0.071</td>
                <td>
                  <bold>0.012±0.037</bold>
                </td>
                <td>0.014±0.003</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>0.055±0.006</td>
                <td>0.997±0.032</td>
                <td>0.056±0.053</td>
                <td>0.164±0.027</td>
                <td>0.141±0.029</td>
                <td>0.062±0.014</td>
                <td>0.901±0.019</td>
                <td>
                  <bold>0.053±0.034</bold>
                </td>
                <td>0.121±0.046</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>0.243±0.120</td>
                <td>0.679±0.021</td>
                <td>0.417±0.027</td>
                <td>0.251±0.041</td>
                <td>
                  <bold>0.226±0.023</bold>
                </td>
                <td>0.287±0.073</td>
                <td>0.796±0.052</td>
                <td>0.281±0.032</td>
                <td>0.263±0.037</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.182±0.017</bold>
                </td>
                <td>0.849±0.033</td>
                <td>0.213±0.031</td>
                <td>0.754±0.029</td>
                <td>0.208±0.015</td>
                <td>0.209±0.013</td>
                <td>0.826±0.018</td>
                <td>0.967±0.023</td>
                <td>0.241±0.016</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.010±0.001</bold>
                </td>
                <td>0.984±0.071</td>
                <td>0.012±0.042</td>
                <td>0.012±0.042</td>
                <td>0.034±0.045</td>
                <td>0.012±0.017</td>
                <td>0.971±0.024</td>
                <td>0.017±0.052</td>
                <td>0.011±0.018</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.124±0.015</bold>
                </td>
                <td>0.821±0.056</td>
                <td>0.204±0.027</td>
                <td>0.126±0.011</td>
                <td>0.308±0.031</td>
                <td>0.144±0.032</td>
                <td>0.839±0.027</td>
                <td>0.218±0.041</td>
                <td>0.221±0.024</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Ranking Loss (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.112±0.005</td>
                <td>0.228±0.031</td>
                <td>0.137±0.061</td>
                <td>0.117±0.039</td>
                <td>0.331±0.036</td>
                <td>
                  <bold>0.108±0.036</bold>
                </td>
                <td>0.159±0.097</td>
                <td>0.124±0.027</td>
                <td>0.102±0.006</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>0.129±0.028</td>
                <td>0.491±0.022</td>
                <td>0.278±0.083</td>
                <td>0.175±0.043</td>
                <td>0.403±0.092</td>
                <td>0.186±0.014</td>
                <td>0.404±0.023</td>
                <td>
                  <bold>0.105±0.037</bold>
                </td>
                <td>0.405±0.021</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.147±0.013</bold>
                </td>
                <td>0.306±0.042</td>
                <td>0.271±0.062</td>
                <td>0.201±0.045</td>
                <td>0.225±0.015</td>
                <td>0.206±0.043</td>
                <td>0.168±0.023</td>
                <td>0.216±0.034</td>
                <td>0.152±0.045</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.166±0.011</bold>
                </td>
                <td>0.219±0.021</td>
                <td>0.245±0.075</td>
                <td>0.181±0.031</td>
                <td>0.211±0.034</td>
                <td>0.218±0.034</td>
                <td>0.246±0.037</td>
                <td>0.213±0.031</td>
                <td>0.179±0.083</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.021±0.004</bold>
                </td>
                <td>0.048±0.083</td>
                <td>0.025±0.075</td>
                <td>0.031±0.044</td>
                <td>0.148±0.025</td>
                <td>0.032±0.032</td>
                <td>0.024±0.071</td>
                <td>0.049±0.018</td>
                <td>0.023±0.034</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.099±0.003</bold>
                </td>
                <td>0.114±0.028</td>
                <td>0.228±0.045</td>
                <td>0.116±0.063</td>
                <td>0.714±0.042</td>
                <td>0.156±0.057</td>
                <td>0.154±0.046</td>
                <td>0.169±0.035</td>
                <td>0.124±0.025</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>One Error (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.351±0.012</td>
                <td>0.617±0.011</td>
                <td>0.443±0.023</td>
                <td>0.363±0.042</td>
                <td>0.854±0.032</td>
                <td>0.369±0.019</td>
                <td>0.470±0.058</td>
                <td>
                  <bold>0.088±0.035</bold>
                </td>
                <td>0.394±0.025</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.355±0.051</bold>
                </td>
                <td>0.837±0.043</td>
                <td>0.652±0.042</td>
                <td>0.388±0.084</td>
                <td>0.584±0.064</td>
                <td>0.425±0.049</td>
                <td>0.523±0.048</td>
                <td>0.585±0.072</td>
                <td>0.474±0.023</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.254±0.048</bold>
                </td>
                <td>0.412±0.035</td>
                <td>0.487±0.054</td>
                <td>0.305±0.071</td>
                <td>0.389±0.035</td>
                <td>0.324±0.046</td>
                <td>0.254±0.036</td>
                <td>0.317±0.083</td>
                <td>0.284±0.043</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.301±0.024</bold>
                </td>
                <td>0.355±0.041</td>
                <td>0.455±0.031</td>
                <td>0.326±0.025</td>
                <td>0.387±0.064</td>
                <td>0.411±0.027</td>
                <td>0.426±0.024</td>
                <td>0.341±0.027</td>
                <td>0.310±0.021</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>0.147±0.018</td>
                <td>0.261±0.057</td>
                <td>
                  <bold>0.132±0.076</bold>
                </td>
                <td>0.153±0.037</td>
                <td>0.612±0.014</td>
                <td>0.151±0.066</td>
                <td>0.184±0.048</td>
                <td>0.235±0.074</td>
                <td>0.154±0.047</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>0.255±0.013</td>
                <td>
                  <bold>0.250±0.053</bold>
                </td>
                <td>0.545±0.036</td>
                <td>0.321±0.026</td>
                <td>0.876±0.021</td>
                <td>0.378±0.036</td>
                <td>0.349±0.028</td>
                <td>0.369±0.039</td>
                <td>0.237±0.084</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Coverage (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.209±0.004</td>
                <td>0.824±0.033</td>
                <td>0.231±0.053</td>
                <td>0.223±0.055</td>
                <td>0.489±0.034</td>
                <td>
                  <bold>0.207±0.037</bold>
                </td>
                <td>0.685±0.054</td>
                <td>0.817±0.019</td>
                <td>0.324±0.053</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.108±0.013</bold>
                </td>
                <td>0.418±0.053</td>
                <td>0.196±0.031</td>
                <td>0.122±0.045</td>
                <td>0.549±0.017</td>
                <td>0.142±0.034</td>
                <td>0.408±0.058</td>
                <td>0.406±0.023</td>
                <td>0.324±0.034</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.293±0.022</bold>
                </td>
                <td>0.377±0.031</td>
                <td>0.375±0.086</td>
                <td>0.359±0.017</td>
                <td>0.319±0.034</td>
                <td>0.352±0.021</td>
                <td>0.536±0.043</td>
                <td>0.341±0.016</td>
                <td>0.301±0.025</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.169±0.008</bold>
                </td>
                <td>0.942±0.052</td>
                <td>0.253±0.015</td>
                <td>0.203±0.044</td>
                <td>0.219±0.013</td>
                <td>0.227±0.048</td>
                <td>0.939±0.013</td>
                <td>0.449±0.033</td>
                <td>0.192±0.015</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.042±0.004</bold>
                </td>
                <td>0.386±0.063</td>
                <td>0.046±0.029</td>
                <td>0.053±0.066</td>
                <td>0.176±0.048</td>
                <td>0.044±0.046</td>
                <td>0.219±0.038</td>
                <td>0.247±0.041</td>
                <td>0.044±0.007</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.098±0.005</bold>
                </td>
                <td>0.651±0.156</td>
                <td>0.208±0.082</td>
                <td>0.110±0.043</td>
                <td>0.615±0.046</td>
                <td>0.146±0.044</td>
                <td>0.407±0.021</td>
                <td>0.341±0.018</td>
                <td>0.131±0.029</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Average Precision (the higher the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.562±0.008</td>
                <td>0.317±0.052</td>
                <td>0.490±0.035</td>
                <td>0.560±0.091</td>
                <td>0.153±0.086</td>
                <td>
                  <bold>0.564±0.013</bold>
                </td>
                <td>0.488±0.057</td>
                <td>0.528±0.021</td>
                <td>0.517±0.023</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.667±0.039</bold>
                </td>
                <td>0.353±0.037</td>
                <td>0.423±0.056</td>
                <td>0.415±0.021</td>
                <td>0.382±0.077</td>
                <td>0.618±0.082</td>
                <td>0.405±0.021</td>
                <td>0.404±0.081</td>
                <td>0.428±0.023</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.829±0.014</bold>
                </td>
                <td>0.667±0.018</td>
                <td>0.627±0.057</td>
                <td>0.779±0.024</td>
                <td>0.723±0.046</td>
                <td>0.772±0.021</td>
                <td>0.794±0.019</td>
                <td>0.754±0.035</td>
                <td>0.827±0.016</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.806±0.011</bold>
                </td>
                <td>0.758±0.063</td>
                <td>0.712±0.031</td>
                <td>0.788±0.063</td>
                <td>0.675±0.028</td>
                <td>0.739±0.018</td>
                <td>0.723±0.034</td>
                <td>0.449±0.032</td>
                <td>0.794±0.029</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.894±0.005</bold>
                </td>
                <td>0.782±0.076</td>
                <td>0.857±0.083</td>
                <td>0.872±0.028</td>
                <td>0.490±0.052</td>
                <td>0.876±0.013</td>
                <td>0.868±0.024</td>
                <td>0.807±0.085</td>
                <td>0.886±0.023</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>0.842±0.004</td>
                <td>0.836±0.032</td>
                <td>0.650±0.028</td>
                <td>0.806±0.031</td>
                <td>0.302±0.072</td>
                <td>0.761±0.023</td>
                <td>0.776±0.027</td>
                <td>0.752±0.064</td>
                <td>
                  <bold>0.851±0.014</bold>
                </td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>microF1 (the higher the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.422±0.011</td>
                <td>0.286±0.043</td>
                <td>0.334±0.028</td>
                <td>0.411±0.021</td>
                <td>0.306±0.054</td>
                <td>
                  <bold>0.443±0.005</bold>
                </td>
                <td>0.393±0.036</td>
                <td>0.413±0.015</td>
                <td>0.409±0.032</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.391±0.016</bold>
                </td>
                <td>0.148±0.035</td>
                <td>0.267±0.048</td>
                <td>0.246±0.039</td>
                <td>0.217±0.029</td>
                <td>0.386±0.036</td>
                <td>0.199±0.014</td>
                <td>0.277±0.072</td>
                <td>0.331±0.045</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>0.667±0.012</td>
                <td>0.543±0.016</td>
                <td>0.561±0.024</td>
                <td>
                  <bold>0.678±0.015</bold>
                </td>
                <td>0.578±0.038</td>
                <td>0.641±0.015</td>
                <td>0.636±0.018</td>
                <td>0.619±0.018</td>
                <td>0.635±0.037</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.612±0.026</bold>
                </td>
                <td>0.476±0.045</td>
                <td>0.526±0.053</td>
                <td>0.561±0.035</td>
                <td>0.494±0.022</td>
                <td>0.558±0.015</td>
                <td>0.510±0.018</td>
                <td>0.383±0.026</td>
                <td>0.558±0.046</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.786±0.022</bold>
                </td>
                <td>0.558±0.032</td>
                <td>0.717±0.064</td>
                <td>0.761±0.015</td>
                <td>0.459±0.043</td>
                <td>0.747±0.055</td>
                <td>0.599±0.017</td>
                <td>0.703±0.049</td>
                <td>0.741±0.055</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.681±0.015</bold>
                </td>
                <td>0.554±0.013</td>
                <td>0.592±0.016</td>
                <td>0.644±0.028</td>
                <td>0.355±0.032</td>
                <td>0.613±0.021</td>
                <td>0.564±0.023</td>
                <td>0.625±0.023</td>
                <td>0.602±0.012</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>The best performances are shown in bold face (<italic>r</italic> = 1, pairwise <italic>t</italic>-test at 0.05 significance level). LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning; PML: partial multi-label learning.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap id="t5">
          <label>Table 5</label>
          <caption>
            <p>Comparison of LCND with state-of-the-art PML methods on six evaluation metrics</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Data</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>LCND</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>ML-KNN</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-<italic>lc</italic></bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PARTICLE</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PAMB</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-NI</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>NATAL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PLAIN</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-TF</bold>
                </td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Hamming Loss (the lower the better)</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>Bibtex</td>
                <td>0.014±0.001</td>
                <td>0.998±0.035</td>
                <td>0.019±0.025</td>
                <td>0.019±0.086</td>
                <td>0.025±0.028</td>
                <td>0.015±0.094</td>
                <td>0.986±0.036</td>
                <td>
                  <bold>0.013±0.017</bold>
                </td>
                <td>0.016±0.084</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.059±0.003</bold>
                </td>
                <td>0.995±0.037</td>
                <td>0.063±0.012</td>
                <td>0.822±0.063</td>
                <td>0.196±0.081</td>
                <td>0.064±0.044</td>
                <td>0.907±0.022</td>
                <td>0.064±0.092</td>
                <td>0.215±0.029</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>0.254±0.010</td>
                <td>0.706±0.048</td>
                <td>0.686±0.075</td>
                <td>0.426±0.054</td>
                <td>
                  <bold>0.232±0.072</bold>
                </td>
                <td>0.336±0.023</td>
                <td>0.803±0.053</td>
                <td>0.444±0.018</td>
                <td>0.274±0.046</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.192±0.016</bold>
                </td>
                <td>0.754±0.072</td>
                <td>0.216±0.074</td>
                <td>0.765±0.032</td>
                <td>0.265±0.018</td>
                <td>0.238±0.013</td>
                <td>0.762±0.069</td>
                <td>0.973±0.022</td>
                <td>0.261±0.025</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.011±0.001</bold>
                </td>
                <td>0.986±0.044</td>
                <td>0.413±0.021</td>
                <td>0.015±0.045</td>
                <td>0.035±0.094</td>
                <td>0.013±0.021</td>
                <td>0.974±0.045</td>
                <td>0.017±0.045</td>
                <td>0.012±0.027</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.127±0.013</bold>
                </td>
                <td>0.861±0.016</td>
                <td>0.343±0.038</td>
                <td>0.197±0.044</td>
                <td>0.324±0.034</td>
                <td>0.183±0.059</td>
                <td>0.845±0.023</td>
                <td>0.396±0.084</td>
                <td>0.228±0.054</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Ranking Loss (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.118±0.003</td>
                <td>0.231±0.008</td>
                <td>0.179±0.061</td>
                <td>0.128±0.024</td>
                <td>0.364±0.075</td>
                <td>0.131±0.027</td>
                <td>0.168±0.056</td>
                <td>
                  <bold>0.111±0.022</bold>
                </td>
                <td>0.105±0.043</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>0.186±0.039</td>
                <td>0.473±0.034</td>
                <td>0.284±0.016</td>
                <td>0.213±0.034</td>
                <td>0.416±0.022</td>
                <td>0.187±0.011</td>
                <td>0.419±0.061</td>
                <td>
                  <bold>0.109±0.063</bold>
                </td>
                <td>0.409±0.011</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.179±0.024</bold>
                </td>
                <td>0.353±0.013</td>
                <td>0.392±0.039</td>
                <td>0.238±0.034</td>
                <td>0.245±0.019</td>
                <td>0.224±0.082</td>
                <td>0.245±0.022</td>
                <td>0.308±0.049</td>
                <td>0.189±0.017</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.181±0.016</bold>
                </td>
                <td>0.276±0.043</td>
                <td>0.264±0.067</td>
                <td>0.189±0.073</td>
                <td>0.338±0.042</td>
                <td>0.256±0.041</td>
                <td>0.306±0.056</td>
                <td>0.245±0.063</td>
                <td>0.182±0.037</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.029±0.007</bold>
                </td>
                <td>0.079±0.037</td>
                <td>0.035±0.026</td>
                <td>0.042±0.018</td>
                <td>0.157±0.023</td>
                <td>0.035±0.024</td>
                <td>0.038±0.021</td>
                <td>0.073±0.028</td>
                <td>0.031±0.034</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.110±0.006</bold>
                </td>
                <td>0.153±0.084</td>
                <td>0.259±0.052</td>
                <td>0.177±0.016</td>
                <td>0.781±0.039</td>
                <td>0.187±0.019</td>
                <td>0.214±0.038</td>
                <td>0.244±0.062</td>
                <td>0.132±0.016</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>One Error (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.383±0.034</td>
                <td>0.627±0.064</td>
                <td>0.443±0.041</td>
                <td>0.384±0.083</td>
                <td>0.858±0.051</td>
                <td>
                  <bold>0.376±0.029</bold>
                </td>
                <td>0.471±0.011</td>
                <td>0.437±0.073</td>
                <td>0.429±0.083</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.431±0.029</bold>
                </td>
                <td>0.775±0.014</td>
                <td>0.662±0.019</td>
                <td>0.474±0.061</td>
                <td>0.600±0.054</td>
                <td>0.447±0.089</td>
                <td>0.571±0.024</td>
                <td>0.692±0.045</td>
                <td>0.486±0.031</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.318±0.026</bold>
                </td>
                <td>0.428±0.026</td>
                <td>0.554±0.091</td>
                <td>0.333±0.064</td>
                <td>0.389±0.054</td>
                <td>0.375±0.056</td>
                <td>0.407±0.086</td>
                <td>0.433±0.033</td>
                <td>0.332±0.023</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>0.334±0.019</td>
                <td>0.462±0.036</td>
                <td>0.472±0.033</td>
                <td>0.347±0.043</td>
                <td>0.502±0.046</td>
                <td>0.478±0.029</td>
                <td>0.432±0.041</td>
                <td>0.389±0.042</td>
                <td>
                  <bold>0.320±0.016</bold>
                </td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.145±0.021</bold>
                </td>
                <td>0.291±0.013</td>
                <td>0.158±0.096</td>
                <td>0.198±0.091</td>
                <td>0.632±0.048</td>
                <td>0.161±0.047</td>
                <td>0.234±0.072</td>
                <td>0.296±0.082</td>
                <td>0.165±0.034</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.279±0.000</bold>
                </td>
                <td>0.318±0.093</td>
                <td>0.555±0.048</td>
                <td>0.425±0.046</td>
                <td>0.900±0.027</td>
                <td>0.419±0.048</td>
                <td>0.389±0.083</td>
                <td>0.531±0.048</td>
                <td>0.296±0.043</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Coverage (the lower the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>
                  <bold>0.227±0.008</bold>
                </td>
                <td>0.889±0.024</td>
                <td>0.238±0.002</td>
                <td>0.231±0.041</td>
                <td>0.505±0.084</td>
                <td>0.241±0.018</td>
                <td>0.613±0.028</td>
                <td>0.912±0.034</td>
                <td>0.591±0.032</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.132±0.036</bold>
                </td>
                <td>0.413±0.049</td>
                <td>0.212±0.017</td>
                <td>0.156±0.051</td>
                <td>0.680±0.021</td>
                <td>0.149±0.041</td>
                <td>0.436±0.024</td>
                <td>0.449±0.046</td>
                <td>0.401±0.008</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.319±0.021</bold>
                </td>
                <td>0.436±0.031</td>
                <td>0.471±0.029</td>
                <td>0.394±0.073</td>
                <td>0.342±0.046</td>
                <td>0.358±0.014</td>
                <td>0.545±0.039</td>
                <td>0.453±0.028</td>
                <td>0.323±0.027</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.198±0.014</bold>
                </td>
                <td>0.947±0.041</td>
                <td>0.259±0.043</td>
                <td>0.219±0.028</td>
                <td>0.323±0.077</td>
                <td>0.255±0.037</td>
                <td>0.939±0.033</td>
                <td>0.299±0.031</td>
                <td>0.205±0.014</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.044±0.013</bold>
                </td>
                <td>0.457±0.026</td>
                <td>0.051±0.098</td>
                <td>0.064±0.023</td>
                <td>0.201±0.016</td>
                <td>0.052±0.072</td>
                <td>0.283±0.098</td>
                <td>0.309±0.038</td>
                <td>0.048±0.039</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.105±0.005</bold>
                </td>
                <td>0.846±0.043</td>
                <td>0.229±0.034</td>
                <td>0.163±0.037</td>
                <td>0.674±0.084</td>
                <td>0.176±0.041</td>
                <td>0.415±0.082</td>
                <td>0.451±0.057</td>
                <td>0.141±0.032</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Average Precision (the higher the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>
                  <bold>0.551±0.008</bold>
                </td>
                <td>0.307±0.063</td>
                <td>0.482±0.049</td>
                <td>0.536±0.053</td>
                <td>0.150±0.019</td>
                <td>0.537±0.064</td>
                <td>0.485±0.048</td>
                <td>0.504±0.027</td>
                <td>0.507±0.058</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.632±0.036</bold>
                </td>
                <td>0.316±0.073</td>
                <td>0.411±0.970</td>
                <td>0.397±0.077</td>
                <td>0.377±0.049</td>
                <td>0.587±0.049</td>
                <td>0.401±0.012</td>
                <td>0.358±0.034</td>
                <td>0.413±0.046</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>0.784±0.014</td>
                <td>0.650±0.025</td>
                <td>0.599±0.068</td>
                <td>0.739±0.053</td>
                <td>0.714±0.047</td>
                <td>0.730±0.043</td>
                <td>0.718±0.024</td>
                <td>0.666±0.015</td>
                <td>
                  <bold>0.794±0.037</bold>
                </td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.801±0.014</bold>
                </td>
                <td>0.697±0.027</td>
                <td>0.698±0.081</td>
                <td>0.775±0.074</td>
                <td>0.653±0.027</td>
                <td>0.698±0.033</td>
                <td>0.696±0.015</td>
                <td>0.406±0.046</td>
                <td>0.786±0.033</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.892±0.023</bold>
                </td>
                <td>0.753±0.061</td>
                <td>0.839±0.019</td>
                <td>0.831±0.029</td>
                <td>0.471±0.044</td>
                <td>0.858±0.044</td>
                <td>0.805±0.076</td>
                <td>0.736±0.048</td>
                <td>0.859±0.021</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.819±0.015</bold>
                </td>
                <td>0.793±0.042</td>
                <td>0.637±0.066</td>
                <td>0.731±0.042</td>
                <td>0.266±0.017</td>
                <td>0.731±0.017</td>
                <td>0.729±0.012</td>
                <td>0.646±0.066</td>
                <td>0.746±0.056</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>microF1 (the higher the better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.403±0.034</td>
                <td>0.258±0.037</td>
                <td>0.388±0.035</td>
                <td>0.400±0.023</td>
                <td>0.287±0.011</td>
                <td>
                  <bold>0.410±0.009</bold>
                </td>
                <td>0.383±0.030</td>
                <td>0.399±0.017</td>
                <td>0.382±0.023</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.367±0.018</bold>
                </td>
                <td>0.139±0.056</td>
                <td>0.250±0.067</td>
                <td>0.227±0.055</td>
                <td>0.207±0.040</td>
                <td>0.351±0.043</td>
                <td>0.177±0.022</td>
                <td>0.254±0.045</td>
                <td>0.294±0.011</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.643±0.011</bold>
                </td>
                <td>0.521±0.025</td>
                <td>0.536±0.041</td>
                <td>0.615±0.037</td>
                <td>0.563±0.036</td>
                <td>0.593±0.035</td>
                <td>0.605±0.025</td>
                <td>0.557±0.025</td>
                <td>0.597±0.026</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.627±0.025</bold>
                </td>
                <td>0.464±0.036</td>
                <td>0.507±0.024</td>
                <td>0.527±0.033</td>
                <td>0.489±0.019</td>
                <td>0.492±0.012</td>
                <td>0.471±0.023</td>
                <td>0.355±0.035</td>
                <td>0.585±0.021</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.741±0.014</bold>
                </td>
                <td>0.503±0.059</td>
                <td>0.679±0.035</td>
                <td>0.701±0.023</td>
                <td>0.437±0.033</td>
                <td>0.710±0.009</td>
                <td>0.557±0.047</td>
                <td>0.647±0.032</td>
                <td>0.701±0.019</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.648±0.012</bold>
                </td>
                <td>0.516±0.012</td>
                <td>0.576±0.034</td>
                <td>0.589±0.033</td>
                <td>0.280±0.019</td>
                <td>0.542±0.017</td>
                <td>0.528±0.018</td>
                <td>0.551±0.067</td>
                <td>0.563±0.032</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Best performances are shown in bold face (<italic>r</italic> = 2, pairwise <italic>t</italic>-test at 0.05 significance level). LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning; PML: partial multi-label learning.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap id="t6">
          <label>Table 6</label>
          <caption>
            <p>Comparison of LCND with state-of-the-art PML methods on six evaluation metrics</p>
          </caption>
          <table frame="hsides" rules="groups" pdfpage="19">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Data</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>LCND</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>ML-KNN</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-<italic>lc</italic></bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PARTICLE</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PAMB</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-NI</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>NATAL</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PLAIN</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PML-TF</bold>
                </td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Hamming Loss (lower is better)</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>Bibtex</td>
                <td>0.015 ± 0.001</td>
                <td>0.998 ± 0.018</td>
                <td>0.019 ± 0.012</td>
                <td>0.021 ± 0.032</td>
                <td>0.025 ± 0.063</td>
                <td>0.016 ± 0.073</td>
                <td>0.987 ± 0.014</td>
                <td>
                  <bold>0.013 ± 0.072</bold>
                </td>
                <td>0.018 ± 0.094</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.062 ± 0.005</bold>
                </td>
                <td>0.996 ± 0.035</td>
                <td>0.079 ± 0.077</td>
                <td>0.212 ± 0.042</td>
                <td>0.235 ± 0.023</td>
                <td>0.067 ± 0.047</td>
                <td>0.935 ± 0.028</td>
                <td>0.069 ± 0.027</td>
                <td>0.234 ± 0.021</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>0.295 ± 0.033</td>
                <td>0.813 ± 0.035</td>
                <td>0.696 ± 0.018</td>
                <td>0.599 ± 0.032</td>
                <td>
                  <bold>0.257 ± 0.037</bold>
                </td>
                <td>0.557 ± 0.026</td>
                <td>0.816 ± 0.029</td>
                <td>0.533 ± 0.026</td>
                <td>0.292 ± 0.013</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.194 ± 0.006</bold>
                </td>
                <td>0.751 ± 0.058</td>
                <td>0.225 ± 0.023</td>
                <td>0.793 ± 0.022</td>
                <td>0.312 ± 0.047</td>
                <td>0.274 ± 0.065</td>
                <td>0.776 ± 0.067</td>
                <td>0.984 ± 0.036</td>
                <td>0.275 ± 0.026</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.012 ± 0.001</bold>
                </td>
                <td>0.989 ± 0.032</td>
                <td>0.017 ± 0.081</td>
                <td>0.018 ± 0.016</td>
                <td>0.038 ± 0.012</td>
                <td>0.015 ± 0.024</td>
                <td>0.981 ± 0.041</td>
                <td>0.022 ± 0.074</td>
                <td>
                  <bold>0.012 ± 0.000</bold>
                </td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.151 ± 0.019</bold>
                </td>
                <td>0.874 ± 0.034</td>
                <td>0.733 ± 0.047</td>
                <td>0.274 ± 0.043</td>
                <td>0.353 ± 0.043</td>
                <td>0.278 ± 0.022</td>
                <td>0.858 ± 0.026</td>
                <td>0.525 ± 0.022</td>
                <td>0.265 ± 0.034</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Ranking Loss (lower is better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.125 ± 0.003</td>
                <td>0.243 ± 0.071</td>
                <td>0.198 ± 0.019</td>
                <td>0.136 ± 0.014</td>
                <td>0.405 ± 0.057</td>
                <td>0.141 ± 0.064</td>
                <td>0.176 ± 0.041</td>
                <td>0.127 ± 0.026</td>
                <td>
                  <bold>0.107 ± 0.076</bold>
                </td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>0.214 ± 0.045</td>
                <td>0.473 ± 0.021</td>
                <td>0.323 ± 0.016</td>
                <td>0.237 ± 0.013</td>
                <td>0.479 ± 0.022</td>
                <td>0.219 ± 0.036</td>
                <td>0.441 ± 0.054</td>
                <td>
                  <bold>0.114 ± 0.055</bold>
                </td>
                <td>0.448 ± 0.064</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>0.229 ± 0.021</td>
                <td>0.409 ± 0.029</td>
                <td>0.398 ± 0.047</td>
                <td>0.344 ± 0.014</td>
                <td>0.291 ± 0.014</td>
                <td>0.333 ± 0.077</td>
                <td>0.374 ± 0.045</td>
                <td>0.323 ± 0.047</td>
                <td>
                  <bold>0.143 ± 0.075</bold>
                </td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.184 ± 0.019</bold>
                </td>
                <td>0.343 ± 0.028</td>
                <td>0.271 ± 0.033</td>
                <td>0.192 ± 0.032</td>
                <td>0.394 ± 0.017</td>
                <td>0.319 ± 0.018</td>
                <td>0.386 ± 0.071</td>
                <td>0.376 ± 0.022</td>
                <td>0.269 ± 0.052</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.033 ± 0.006</bold>
                </td>
                <td>0.083 ± 0.063</td>
                <td>0.038 ± 0.066</td>
                <td>0.036 ± 0.024</td>
                <td>0.167 ± 0.034</td>
                <td>0.040 ± 0.024</td>
                <td>0.074 ± 0.022</td>
                <td>0.076 ± 0.017</td>
                <td>0.034 ± 0.029</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.138 ± 0.007</bold>
                </td>
                <td>0.184 ± 0.107</td>
                <td>0.288 ± 0.045</td>
                <td>0.205 ± 0.034</td>
                <td>0.832 ± 0.038</td>
                <td>0.222 ± 0.032</td>
                <td>0.253 ± 0.076</td>
                <td>0.302 ± 0.057</td>
                <td>0.156 ± 0.038</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>One Error (lower is better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>
                  <bold>0.391 ± 0.018</bold>
                </td>
                <td>0.632 ± 0.021</td>
                <td>0.455 ± 0.077</td>
                <td>0.393 ± 0.065</td>
                <td>0.859 ± 0.094</td>
                <td>0.395 ± 0.045</td>
                <td>0.509 ± 0.036</td>
                <td>0.478 ± 0.061</td>
                <td>0.442 ± 0.008</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.453 ± 0.036</bold>
                </td>
                <td>0.736 ± 0.062</td>
                <td>0.715 ± 0.094</td>
                <td>0.533 ± 0.028</td>
                <td>0.752 ± 0.031</td>
                <td>0.493 ± 0.054</td>
                <td>0.609 ± 0.013</td>
                <td>0.754 ± 0.064</td>
                <td>0.531 ± 0.022</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>0.351 ± 0.014</td>
                <td>0.546 ± 0.074</td>
                <td>0.579 ± 0.072</td>
                <td>0.582 ± 0.028</td>
                <td>0.407 ± 0.092</td>
                <td>0.426 ± 0.046</td>
                <td>0.455 ± 0.031</td>
                <td>0.550 ± 0.039</td>
                <td>
                  <bold>0.348 ± 0.025</bold>
                </td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.331 ± 0.029</bold>
                </td>
                <td>0.562 ± 0.011</td>
                <td>0.523 ± 0.014</td>
                <td>0.369 ± 0.043</td>
                <td>0.612 ± 0.033</td>
                <td>0.509 ± 0.048</td>
                <td>0.565 ± 0.023</td>
                <td>0.415 ± 0.021</td>
                <td>0.365 ± 0.064</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.153 ± 0.012</bold>
                </td>
                <td>0.332 ± 0.054</td>
                <td>0.194 ± 0.098</td>
                <td>0.215 ± 0.017</td>
                <td>0.653 ± 0.038</td>
                <td>0.212 ± 0.045</td>
                <td>0.288 ± 0.064</td>
                <td>0.347 ± 0.027</td>
                <td>0.195 ± 0.027</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.309 ± 0.007</bold>
                </td>
                <td>0.384 ± 0.029</td>
                <td>0.629 ± 0.024</td>
                <td>0.463 ± 0.055</td>
                <td>0.938 ± 0.046</td>
                <td>0.502 ± 0.064</td>
                <td>0.408 ± 0.034</td>
                <td>0.585 ± 0.048</td>
                <td>0.329 ± 0.083</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Coverage (lower is better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.243 ± 0.003</td>
                <td>0.912 ± 0.005</td>
                <td>
                  <bold>0.242 ± 0.022</bold>
                </td>
                <td>0.251 ± 0.022</td>
                <td>0.529 ± 0.088</td>
                <td>0.253 ± 0.046</td>
                <td>0.612 ± 0.094</td>
                <td>0.928 ± 0.037</td>
                <td>0.598 ± 0.046</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.164 ± 0.035</bold>
                </td>
                <td>0.514 ± 0.077</td>
                <td>0.297 ± 0.038</td>
                <td>0.194 ± 0.026</td>
                <td>0.789 ± 0.044</td>
                <td>0.163 ± 0.027</td>
                <td>0.495 ± 0.031</td>
                <td>0.458 ± 0.054</td>
                <td>0.487 ± 0.071</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>0.334 ± 0.016</td>
                <td>0.474 ± 0.039</td>
                <td>0.488 ± 0.031</td>
                <td>0.444 ± 0.019</td>
                <td>0.381 ± 0.045</td>
                <td>0.459 ± 0.024</td>
                <td>0.567 ± 0.047</td>
                <td>0.576 ± 0.043</td>
                <td>
                  <bold>0.329 ± 0.014</bold>
                </td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.214 ± 0.011</bold>
                </td>
                <td>0.990 ± 0.071</td>
                <td>0.268 ± 0.041</td>
                <td>0.254 ± 0.057</td>
                <td>0.389 ± 0.045</td>
                <td>0.315 ± 0.071</td>
                <td>0.954 ± 0.065</td>
                <td>0.345 ± 0.043</td>
                <td>0.239 ± 0.016</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.055 ± 0.029</bold>
                </td>
                <td>0.456 ± 0.035</td>
                <td>0.054 ± 0.012</td>
                <td>0.095 ± 0.043</td>
                <td>0.216 ± 0.076</td>
                <td>0.056 ± 0.066</td>
                <td>0.328 ± 0.026</td>
                <td>0.359 ± 0.046</td>
                <td>0.057 ± 0.025</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.134 ± 0.013</bold>
                </td>
                <td>0.986 ± 0.071</td>
                <td>0.261 ± 0.034</td>
                <td>0.185 ± 0.061</td>
                <td>0.715 ± 0.064</td>
                <td>0.198 ± 0.037</td>
                <td>0.466 ± 0.094</td>
                <td>0.589 ± 0.035</td>
                <td>0.159 ± 0.047</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>Average Precision (higher is better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>
                  <bold>0.534 ± 0.011</bold>
                </td>
                <td>0.306 ± 0.037</td>
                <td>0.473 ± 0.042</td>
                <td>0.518 ± 0.054</td>
                <td>0.146 ± 0.029</td>
                <td>0.517 ± 0.024</td>
                <td>0.472 ± 0.034</td>
                <td>0.461 ± 0.045</td>
                <td>0.492 ± 0.035</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.599 ± 0.042</bold>
                </td>
                <td>0.258 ± 0.034</td>
                <td>0.389 ± 0.018</td>
                <td>0.352 ± 0.061</td>
                <td>0.339 ± 0.071</td>
                <td>0.541 ± 0.018</td>
                <td>0.415 ± 0.067</td>
                <td>0.293 ± 0.035</td>
                <td>0.398 ± 0.027</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.754 ± 0.011</bold>
                </td>
                <td>0.595 ± 0.034</td>
                <td>0.590 ± 0.012</td>
                <td>0.608 ± 0.046</td>
                <td>0.709 ± 0.034</td>
                <td>0.662 ± 0.029</td>
                <td>0.622 ± 0.061</td>
                <td>0.621 ± 0.049</td>
                <td>0.738 ± 0.064</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.793 ± 0.027</bold>
                </td>
                <td>0.626 ± 0.081</td>
                <td>0.674 ± 0.031</td>
                <td>0.767 ± 0.051</td>
                <td>0.617 ± 0.084</td>
                <td>0.655 ± 0.014</td>
                <td>0.613 ± 0.041</td>
                <td>0.393 ± 0.048</td>
                <td>0.706 ± 0.017</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.883 ± 0.016</bold>
                </td>
                <td>0.720 ± 0.067</td>
                <td>0.836 ± 0.097</td>
                <td>0.819 ± 0.051</td>
                <td>0.471 ± 0.037</td>
                <td>0.829 ± 0.061</td>
                <td>0.802 ± 0.024</td>
                <td>0.723 ± 0.027</td>
                <td>0.842 ± 0.027</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>0.791 ± 0.012</td>
                <td>0.720 ± 0.042</td>
                <td>0.592 ± 0.066</td>
                <td>0.701 ± 0.053</td>
                <td>0.228 ± 0.034</td>
                <td>0.678 ± 0.073</td>
                <td>
                  <bold>0.801 ± 0.073</bold>
                </td>
                <td>0.573 ± 0.021</td>
                <td>0.721 ± 0.097</td>
              </tr>
              <tr>
                <td colspan="10">
                  <bold>microF1 (higher is better)</bold>
                </td>
              </tr>
              <tr>
                <td>Bibtex</td>
                <td>0.395 ± 0.032</td>
                <td>0.247 ± 0.022</td>
                <td>0.365 ± 0.032</td>
                <td>0.379 ± 0.025</td>
                <td>0.269 ± 0.019</td>
                <td>
                  <bold>0.400 ± 0.004</bold>
                </td>
                <td>0.365 ± 0.019</td>
                <td>0.357 ± 0.041</td>
                <td>0.381 ± 0.014</td>
              </tr>
              <tr>
                <td>Birds</td>
                <td>
                  <bold>0.343 ± 0.015</bold>
                </td>
                <td>0.122 ± 0.024</td>
                <td>0.217 ± 0.019</td>
                <td>0.204 ± 0.033</td>
                <td>0.186 ± 0.056</td>
                <td>0.325 ± 0.012</td>
                <td>0.163 ± 0.024</td>
                <td>0.263 ± 0.046</td>
                <td>0.295 ± 0.017</td>
              </tr>
              <tr>
                <td>Emotions</td>
                <td>
                  <bold>0.554 ± 0.021</bold>
                </td>
                <td>0.468 ± 0.032</td>
                <td>0.492 ± 0.022</td>
                <td>0.515 ± 0.021</td>
                <td>0.492 ± 0.024</td>
                <td>0.499 ± 0.012</td>
                <td>0.496 ± 0.028</td>
                <td>0.495 ± 0.051</td>
                <td>0.551 ± 0.025</td>
              </tr>
              <tr>
                <td>Image</td>
                <td>
                  <bold>0.599 ± 0.018</bold>
                </td>
                <td>0.425 ± 0.051</td>
                <td>0.473 ± 0.031</td>
                <td>0.483 ± 0.049</td>
                <td>0.465 ± 0.052</td>
                <td>0.422 ± 0.018</td>
                <td>0.458 ± 0.032</td>
                <td>0.324 ± 0.021</td>
                <td>0.489 ± 0.038</td>
              </tr>
              <tr>
                <td>Medical</td>
                <td>
                  <bold>0.713 ± 0.009</bold>
                </td>
                <td>0.475 ± 0.048</td>
                <td>0.675 ± 0.021</td>
                <td>0.678 ± 0.019</td>
                <td>0.397 ± 0.029</td>
                <td>0.681 ± 0.017</td>
                <td>0.538 ± 0.025</td>
                <td>0.617 ± 0.015</td>
                <td>0.679 ± 0.022</td>
              </tr>
              <tr>
                <td>Scene</td>
                <td>
                  <bold>0.626 ± 0.025</bold>
                </td>
                <td>0.499 ± 0.034</td>
                <td>0.529 ± 0.047</td>
                <td>0.542 ± 0.017</td>
                <td>0.253 ± 0.024</td>
                <td>0.463 ± 0.029</td>
                <td>0.467 ± 0.031</td>
                <td>0.497 ± 0.047</td>
                <td>0.536 ± 0.036</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>The best performances are shown in bold face (<italic>r</italic> = 3, pairwise <italic>t</italic>-test at 0.05 significance level). LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning; PML: partial multi-label learning.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>To verify the effectiveness of LCND in real-world scenarios, we conducted experiments on the <italic>music_emotion</italic>, <italic>music_style</italic>, and <italic>mirflickr</italic> datasets. Among the eight compared algorithms, PAMB outperforms LCND in terms of Hamming loss on the real-world PML dataset because it adopts a binary decomposition strategy, which can improve the overall proportion of correctly predicted labels on a small portion of the data. However, its performance degrades noticeably on other datasets due to limited robustness to label noise. According to global statistical results for the Hamming loss metric, the overall performance of PAMB is inferior to that of LCND. In the remaining experimental settings, LCND consistently achieves the best or near-best results.</p>
        <p>Additionally, this study employs the Friedman test<sup>[<xref ref-type="bibr" rid="B68">68</xref>]</sup> to evaluate the comparative efficacy of the methods under review and to determine whether there is a statistically significant difference in their generalization capabilities. Let <italic>k</italic> be the number of methods being compared and <italic>N</italic> the total number of datasets used. Let <italic>r<sub>i</sub><sup>j</sup></italic> denote the rank of the <italic>j</italic>-th method on the <italic>i</italic>-th dataset. For the Friedman test, the mean rank of each method is computed as <italic>R<sub>j</sub></italic> = <inline-formula><tex-math id="M1">$$ \frac{1}{N} $$</tex-math></inline-formula>Σ<italic><sub>i</sub></italic><sub>=1</sub><italic><sup>N</sup></italic><italic>r<sub>i</sub><sup>j</sup></italic> (1 ≤ <italic>j</italic> ≤ <italic>k</italic>). Assuming the null hypothesis that the generalization performance of all evaluated methods is equivalent, the Friedman statistic <italic>F<sub>F</sub></italic> is defined and follows an F-distribution with <italic>k</italic>-1 and (<italic>k</italic>-1)(<italic>N</italic>-1) degrees of freedom:</p>
        <p><disp-formula> <label>(34)</label> <tex-math id="E1"> $$  F_{F}=\frac{(N-1)\chi_{F}^{2}}{N(k-1)-\chi_{F}^{2}} $$ </tex-math></disp-formula></p>
        <p>where,</p>
        <p><disp-formula> <label>(35)</label> <tex-math id="E1"> $$  \chi_{F}^{2}=\frac{12 N}{k(k+1)}\left[\sum_{j=1}^{k} R_{j}^{2}-\frac{k(k+1)^{2}}{4}\right] $$ </tex-math></disp-formula></p>
        <p>
          <xref ref-type="table" rid="t7">Table 7</xref> summarizes the Friedman statistics <italic>F<sub>F</sub></italic> and the critical values for the six evaluation criteria (number of compared algorithms <italic>k</italic> = 9, number of datasets <italic>N</italic> = 21). Based on <xref ref-type="table" rid="t7">Table 7</xref>, the null hypothesis that there is no significant performance difference among the compared methods can be rejected at the 0.05 significance level.</p>
        <table-wrap id="t7">
          <label>Table 7</label>
          <caption>
            <p>Friedman test statistics <italic>F<sub>F</sub></italic> for individual assessment metrics and corresponding critical values at the 0.05 significance level (number of compared algorithms <italic>k</italic> = 9, number of data sets <italic>N</italic> = 21)</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Evaluation metric</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>
                    <italic>F<sub>F</sub></italic>
                  </bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Critical value (0.05)</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>Hamming Loss</td>
                <td>28.987</td>
                <td />
              </tr>
              <tr>
                <td>Ranking Loss</td>
                <td>22.760</td>
                <td />
              </tr>
              <tr>
                <td>One Error</td>
                <td>19.948</td>
                <td />
              </tr>
              <tr>
                <td>Coverage</td>
                <td>37.887</td>
                <td>2.302</td>
              </tr>
              <tr>
                <td>Average Precision</td>
                <td>29.420</td>
                <td />
              </tr>
              <tr>
                <td>microF1</td>
                <td>35.928</td>
                <td />
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>In addition, we apply the Bonferroni-Dunn test<sup>[<xref ref-type="bibr" rid="B68">68</xref>]</sup> to further investigate the performance differences among the eight compared algorithms. LCND serves as the benchmark method, and its average rank difference relative to the other methods is measured by the critical difference (CD). We consider the performance difference between LCND and another method to be significant if their mean rank difference exceeds the CD threshold (in this study, CD is set to 2.302, with <italic>k</italic> = 9 algorithms and <italic>N</italic> = 21 datasets). The CD analysis for each metric is shown in <xref ref-type="fig" rid="fig1">Figure 1</xref>. In this figure, the average ranks of the seven methods are plotted, with the best (i.e., smallest) ranks placed on the far right. A bold line connects LCND to a compared method if their average rank difference falls within the CD range.</p>
        <fig id="fig1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>LCND compared with eight algorithms using Bonferroni-Dunn test. If not linked on CD diagram, performance differs significantly (CD = 2.302, 0.05 significance). LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning; CD: critical difference.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6019.fig.1.jpg" />
        </fig>
        <p>From <xref ref-type="fig" rid="fig1">Figure 1</xref>, we can observe that:</p>
        <p>• LCND achieves the best average ranking across all evaluation metrics. As shown in <xref ref-type="fig" rid="fig1">Figure 1</xref>, LCND consistently occupies the rightmost position in the CD diagram for all six metrics, including Hamming loss, Ranking loss, One error, Coverage, Average precision, and microF1. This indicates that LCND outperforms the seven competing algorithms in both error-based and accuracy-based evaluations, demonstrating strong robustness and generalizability.</p>
        <p>• LCND is statistically significantly superior to most baseline methods. With a CD threshold of CD = 2.302 at the 0.05 significance level, algorithms that are not connected by a horizontal bar are considered significantly different. LCND is not comparable to the majority of the competing methods (e.g., ML-KNN, PML-lc, PARTICLE, NATAL, PLAIN, PML-TF) on most metrics, confirming that its performance advantage is statistically significant.</p>
        <p>• The performance improvement of LCND is most pronounced on ranking-oriented metrics. The gap between LCND and the competing methods is particularly large for Ranking loss and Average precision. This demonstrates that the weighted Jaccard label affinity and nonlinear kernel mapping effectively capture fine-grained label semantics, enabling LCND to better distinguish ground-truth labels from noisy candidates during label ranking.</p>
        <p>• LCND achieves a notably better average rank than the recent transformer-based method PML-TF, especially on ranking-oriented metrics, confirming the advantage of explicit nonlinear kernel modeling over implicit deep feature extraction in PML tasks.</p>
      </sec>
      <sec id="sec4-4">
        <title>4.4. Ablation study</title>
        <p>To assess the contribution of key model components, we conduct an ablation study in which we systematically remove these components to observe the resulting changes in performance. The specific configurations for this ablation analysis are outlined below:</p>
        <p>• To validate the effectiveness of the nonlinear component <bold>P</bold> in our model, we perform an ablation analysis by removing this component and evaluating the subsequent performance changes. Specifically, we remove the module <italic>g</italic>(<bold>P</bold>) <inline-formula><tex-math id="M1">$$ \triangleq \sum_{i=1}^n\sqrt{\mathbf{p}_i^T\mathbf{Kp}_i}  $$</tex-math></inline-formula> by directly using the linear LRR formulation in Equation (2). The objective function then becomes:</p>
        <p><disp-formula> <label>(36)</label> <tex-math id="E1"> $$  \begin{aligned}&amp;\min_{\mathbf{W},\mathbf{Z},\mathbf{E}}\|\mathbf{Z}\|_*+\lambda\|\mathbf{E}\|_{2,1}+\frac12\|\mathbf{Y}-\mathbf{W}\mathbf{X}\mathbf{Z}\|_F^2+\alpha\left\|\mathbf{Z}\circ\mathbf{H}\right\|_1^2\\
				&amp;+\beta\|\mathbf{W}\|_F^2\\&amp;\mathrm{~~s.t.~}\mathbf{X}=\mathbf{X Z}+\mathbf{E}\end{aligned} $$ </tex-math></disp-formula></p>
        <p>We refer to this method as LCND-NOK and solve the optimization problem using the ALM method.</p>
        <p>• To demonstrate the impact of label affinity, we remove the term <italic>α</italic>||<bold>Z</bold>○<bold>H</bold>||<sub>1</sub><sup>2</sup>, which is a constraint in LCND, resulting in a modified method called LCND-NOH.</p>
        <p>• To assess the combined influence of the nonlinear component and label affinity, we exclude the label affinity component from the formulation in Equation (36), yielding a variant of the method termed LCND-NOKH.</p>
        <p>
          <xref ref-type="fig" rid="fig2">Figure 2</xref> presents the comparative experimental results of three methods on the <italic>music_style</italic>, <italic>Birds_3</italic>, and <italic>Medical_3</italic> datasets, where average precision is shown as one minus the average precision (i.e., 1 - Average Precision). Key observations are as follows:</p>
        <fig id="fig2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Performance of LCND-NOH, LCND-NOK, LCND-NOKH and LCND. LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6019.fig.2.jpg" />
        </fig>
        <p>• The LCND model outperforms the other methods on all datasets and most metrics, particularly in reducing <italic>One Error</italic> and improving <italic>1 - Average Precision</italic>. The LCND-NOKH model, which lacks both the nonlinear component and label affinity, underperforms compared to LCND-NOK and LCND-NOH. This indicates that jointly modeling label correlations and nonlinear feature structures is essential for achieving optimal performance.</p>
        <p>• LCND-NOK performs well on some metrics by modeling features in linear subspaces, but it does not outperform the full model. On the <italic>Medical_3</italic> dataset, where the feature dimension is larger than the number of instances (<italic>d</italic> &gt; <italic>n</italic>), the need to handle nonlinear problems becomes evident. These results confirm that nonlinear feature induction and label relationships improve training. Our ablation study demonstrates the superior performance and reliability of the complete model.</p>
      </sec>
      <sec id="sec4-5">
        <title>4.5. Comparison of different kernel functions</title>
        <p>To validate the effectiveness and generality of different kernel functions, this section presents comparative experiments using the polynomial, Sigmoid, arctan, and Gaussian kernels on both real-world and synthetic datasets. The results are summarized in <xref ref-type="fig" rid="fig3">Figure 3</xref>.</p>
        <fig id="fig3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>The comparative results of different kernel functions.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6019.fig.3.jpg" />
        </fig>
        <p>As shown in <xref ref-type="fig" rid="fig3">Figure 3</xref>, the Gaussian kernel function significantly outperforms all other kernels across all six performance metrics. This superiority stems from the inherent mechanism of the Gaussian kernel: it embeds sample data into an infinite-dimensional RKHS via implicit feature mapping. This property theoretically enables the Gaussian kernel to approximate arbitrarily complex nonlinear decision boundaries, demonstrating exceptional versatility in addressing nonlinear classification problems.</p>
      </sec>
      <sec id="sec4-6">
        <title>4.6. Comparison of different label functions</title>
        <p>To rigorously verify the effectiveness of the proposed weighted Jaccard distance, we conducted additional ablation experiments comparing three variants of label similarity metrics:<break/>1. LCND-H: LCND using the standard Jaccard similarity (i.e., with equal label weights).<break/>2. LCND-CH: LCND using the cosine similarity between label vectors.</p>
        <p>The experiments were performed on three representative datasets with distinct characteristics: <italic>music_emotion</italic>, <italic>Medical_3</italic>, and <italic>Birds_2</italic>. The results are shown in <xref ref-type="fig" rid="fig4">Figure 4</xref>, from which we make the following observations:</p>
        <fig id="fig4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Performance of LCND-H, LCND-CH and LCND. LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6019.fig.4.jpg" />
        </fig>
        <p>1. The weighted Jaccard distance consistently outperforms the standard Jaccard distance. On all three datasets, LCND achieves significantly higher average precision than LCND-H. This improvement arises because the standard Jaccard distance treats all labels equally and cannot distinguish frequent labels from rare, specific, or noisy ones. In contrast, the proposed weighting scheme adaptively enhances the contribution of informative labels while suppressing the influence of noisy or trivial labels.</p>
        <p>2. The weighted Jaccard distance also outperforms the cosine similarity. LCND-CH yields the lowest average precision across all datasets. Cosine similarity computed directly on binary label vectors is highly sensitive to the sparsity and label noise in the candidate label sets of PML. In comparison, the weighted Jaccard distance incorporates global label statistics (i.e., label frequency and co-occurrence) and is more robust to random label noise.</p>
        <p>These findings demonstrate that the proposed weighted Jaccard distance is a critical component for robust label disambiguation in PML. The weighting scheme effectively leverages global label statistics to mitigate the adverse effects of label noise and sparsity, achieving consistent and significant performance improvements over both the standard Jaccard distance and the cosine similarity.</p>
      </sec>
      <sec id="sec4-7">
        <title>4.7. Parameter analysis</title>
        <p>Within the scope of this study, we consider four regularization parameters: <italic>α</italic>, <italic>β</italic>, <italic>γ</italic>, and <italic>λ</italic>. These parameters are selected from the interval [10<sup>-3</sup>, 10<sup>3</sup>] using a grid search strategy. To investigate its impact, we present experimental results of the LCND classifier by adjusting one parameter at a time while keeping the other three fixed. The data in <xref ref-type="fig" rid="fig5">Figures 5</xref> and <xref ref-type="fig" rid="fig6">6</xref> indicate that the overall trends of <italic>α</italic> and <italic>γ</italic> remain stable across different datasets. The <italic>λ</italic> parameter is also stable except for the extremely small value of 10<sup>-3</sup>. The <italic>β</italic> parameter first increases and then decreases as its value increases, with the optimal parameter range consistently falling between 1 and 10 across all datasets.</p>
        <fig id="fig5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>The performance of LCND on the <italic>mirflickr</italic> dataset across a range of trade-off parameter values. LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6019.fig.5.jpg" />
        </fig>
        <fig id="fig6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>The performance of LCND on the <italic>Medical_1</italic> dataset across a range of trade-off parameter values. LCND: Label co-occurrence guided nonlinear disambiguation for partial multi-label learning.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ir6019.fig.6.jpg" />
        </fig>
      </sec>
      <sec id="sec4-8">
        <title>4.8. Computational complexity</title>
        <p>In the context of the LCND algorithm, <italic>T<sub>LCND</sub></italic> denotes the total number of iterations required. It is not necessary to compute the inverse (<bold>XVV</bold><italic><sup>T</sup></italic><bold>X</bold><italic><sup>T</sup> </italic>+ 2<italic>β</italic><bold>I</bold><italic><sub>d</sub></italic>)<sup>-1</sup> at every iteration; thus, computing <bold>W</bold> according to Equation (18) incurs a complexity of <inline-formula><tex-math id="M1">$$ \mathcal{O} $$</tex-math></inline-formula>(<italic>n</italic><sup>2</sup><italic>d</italic> + <italic>mdn</italic> + <italic>md</italic><sup>2</sup>). Similarly, the inverse of (<bold>WX</bold>)<italic><sup>T</sup></italic>(<bold>WX</bold>) +<italic>μ</italic><bold>I</bold> does not need to be computed iteratively, which reduces the cost of updating <bold>V</bold> as per Equation (19) to <inline-formula><tex-math id="M1">$$ \mathcal{O} $$</tex-math></inline-formula>(<italic>n</italic><sup>3</sup>). For updating <bold>J</bold>, a partial SVD approach can be used for singular value shrinkage, which has a time complexity of <inline-formula><tex-math id="M1">$$ \mathcal{O} $$</tex-math></inline-formula>(<italic>rn</italic><sup>2</sup>), where <italic>r</italic> is the rank used in the partial SVD at a given iteration. Updating <bold>Z</bold> according to Equation (22) has a complexity of <inline-formula><tex-math id="M1">$$ \mathcal{O} $$</tex-math></inline-formula>(<italic>n</italic><sup>2</sup>). The soft-thresholding operation for <bold>U</bold>, as detailed in Equation (24), also has a complexity of <inline-formula><tex-math id="M1">$$ \mathcal{O} $$</tex-math></inline-formula>(<italic>n</italic><sup>2</sup>). During the update of <bold>P</bold>, <italic>n</italic> subproblems of the form given in Equation (27) must be solved, each with a complexity of <inline-formula><tex-math id="M1">$$ \mathcal{O} $$</tex-math></inline-formula>(<italic>r<sub>X</sub></italic><sup>2</sup>) due to matrix-vector multiplications as outlined in Theorem 1, where <italic>r<sub>X</sub></italic> denotes the rank of <bold>X</bold>. The complexity of the bisection method [Equation (33)] is <inline-formula><tex-math id="M1">$$ \mathcal{O} $$</tex-math></inline-formula>(<italic>n</italic>·<italic>r</italic>·log(<inline-formula><tex-math id="M1">$$ \mathrm{\frac{high-low}{tol}}  $$</tex-math></inline-formula>)), where tol is the tolerance set to 1 × 10<sup>-4</sup>, and “low” and “high” are the lower and upper bounds. Consequently, the overall complexity of solving LCND is <inline-formula><tex-math id="M1">$$ \mathcal{O} $$</tex-math></inline-formula>(<italic>T<sub>LCND</sub></italic>((<italic>d</italic> + <italic>r</italic> + <italic>m</italic> + <italic>r<sub>X</sub></italic>)<italic>n</italic><sup>2</sup> + <italic>mdn</italic> + <italic>md</italic> + <italic>n</italic><sup>3</sup>)).</p>
        <p>We note that the label affinity matrix <bold>H</bold> constructed via the weighted Jaccard distance is highly sparse in practice. Because the candidate label sets of most instance pairs have little or no overlap, the vast majority of entries in <bold>H</bold> are either exactly zero or negligibly small. In our implementation, <bold>H</bold> can be stored in a sparse matrix format. This sparsity significantly reduces the computational cost of the element-wise product <bold>Z○H</bold> and the associated <italic>ℓ</italic><sub>1</sub> penalty. Moreover, the sparse structure of <bold>H</bold> naturally encourages sparsity in the learned instance affinity matrix <bold>Z</bold>, which in turn enables the use of scalable sparse linear algebra routines and iterative solvers, thereby avoiding full <italic>n</italic> × <italic>n</italic> matrix inversions. This sparsity-driven strategy provides a practical and effective way to extend LCND to large-scale datasets while fully preserving its nonlinear modeling capability.</p>
      </sec>
    </sec>
    <sec id="sec5">
      <title>5. CONCLUSION</title>
      <p>This paper proposes LCND, a novel framework designed to address nonlinear, partial, MLL problems. By leveraging kernel LRR, it effectively captures nonlinear data associations often overlooked by conventional linear methods, while integrating a weighted Jaccard distance to quantify label correlations and enhance label denoising. Empirical results show that LCND outperforms traditional approaches, highlighting the importance of modeling nonlinear data structures and label interconnections. This work offers a new perspective for tackling complex PML tasks. Future work will focus on extending LCND to a broader range of applications.</p>
    </sec>
  </body>
  <back>
    <sec>
      <title>DECLARATIONS</title>
      <sec>
        <title>Authors’ contributions</title>
        <p>Made substantial contributions to conception and design of the study and performed data analysis and interpretation: Song, Y.; Qi, F.; Feng, J.; Li, Z.</p>
        <p>Performed data acquisition, as well as provided administrative, technical, and material support: Huang, L.; Bu, Q.; Lu, W.; Fan, J.</p>
      </sec>
      <sec>
        <title>Availability of data and materials</title>
        <p>The Music Emotion and Music Style datasets used in this study are publicly available in the PALM Lab Partial Multi-label Learning Dataset Repository at <uri xlink:href="https://palm.seu.edu.cn/zhangml/Resources.htm">https://palm.seu.edu.cn/zhangml/Resources.htm</uri><sup>[<xref ref-type="bibr" rid="B44">44</xref>]</sup>. The Mirflickr data used in this study are publicly available in the PALM Lab Partial Multi-label Learning Dataset Repository at <uri xlink:href="https://palm.seu.edu.cn/zhangml/Resources.htm">https://palm.seu.edu.cn/zhangml/Resources.htm</uri><sup>[<xref ref-type="bibr" rid="B60">60</xref>]</sup>.<break/>The image data used in this study are publicly available in the PALM Lab Partial Multi-label Learning Dataset Repository at <uri xlink:href="https://palm.seu.edu.cn/zhangml/Resources.htm">https://palm.seu.edu.cn/zhangml/Resources.htm</uri><sup>[<xref ref-type="bibr" rid="B9">9</xref>]</sup>.<break/>The BibTex data presented in this study are available in the Mulan Multi-label Learning Dataset Repository at <uri xlink:href="https://mulan.sourceforge.net/datasets-mlc.html">https://mulan.sourceforge.net/datasets-mlc.html</uri><sup>[<xref ref-type="bibr" rid="B61">61</xref>]</sup>.<break/>The birds’ data presented in this study are available in Mulan Multi-label Learning Dataset Repository at <uri xlink:href="https://mulan.sourceforge.net/datasets-mlc.html">https://mulan.sourceforge.net/datasets-mlc.html</uri><sup>[<xref ref-type="bibr" rid="B62">62</xref>]</sup>.<break/>The emotions data presented in this study are available in Mulan Multi-label Learning Dataset Repository at <uri xlink:href="https://mulan.sourceforge.net/datasets-mlc.html">https://mulan.sourceforge.net/datasets-mlc.html</uri><sup>[<xref ref-type="bibr" rid="B63">63</xref>]</sup>.<break/>The medical data presented in this study are available in Mulan Multi-label Learning Dataset Repository at <uri xlink:href="https://mulan.sourceforge.net/datasets-mlc.html">https://mulan.sourceforge.net/datasets-mlc.html</uri><sup>[<xref ref-type="bibr" rid="B64">64</xref>]</sup>.<break/>The scene data presented in this study are available in Mulan Multi-label Learning Dataset Repository at <uri xlink:href="https://mulan.sourceforge.net/datasets-mlc.html">https://mulan.sourceforge.net/datasets-mlc.html</uri><sup>[<xref ref-type="bibr" rid="B8">8</xref>]</sup>.</p>
      </sec>
      <sec>
        <title>AI and AI-assisted tools statement</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Financial support and sponsorship</title>
        <p>This research was supported by the National Natural Science Foundation of China (under Project No. 62401309), the Natural Science Foundation of Shandong Province (under Project No. ZR2024QF119), the Qingdao Natural Science Foundation Project (under Project No. 24-4-4-zrjj-89-jch), the China Postdoctoral Science Foundation (under Project No. 2025M771692), the Open Fund Project of Key Laboratory of Computing Power Internet and Information Security, Ministry of Education (under Project No. 2024PY030), and the National Natural Science Foundation of China (under Project No. 62376130).</p>
      </sec>
      <sec>
        <title>Conflicts of interest</title>
        <p>All authors declared that there are no conflicts of interest.</p>
      </sec>
      <sec>
        <title>Ethical approval and consent to participate</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Consent for publication</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Copyright</title>
        <p>© The Author(s) 2026.</p>
      </sec>
	  <sec sec-type="supplementary-material">
      <title>Supplementary Materials</title>
          <supplementary-material content-type="local-data">
                <media xlink:href="ir6019-SupplementaryMaterials.pdf" mimetype="application/pdf">
                        <caption>
                                <p>Supplementary Materials</p>
                        </caption>
                </media>
          </supplementary-material>

          </sec>
    </sec>
    <ref-list>
      <ref id="B1">
        <label>1</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>ML</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>ZH</given-names>
            </name>
          </person-group>
          <article-title>A review on multi-label learning algorithms</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2014</year>
          <volume>26</volume>
          <fpage>1819</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.1109/TKDE.2013.39</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B2">
        <label>2</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Qian</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Xiong</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Ding</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Vong</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Label correlations-based multi-label feature selection with label enhancement</article-title>
          <source>Eng Appl Artif Intell</source>
          <year>2024</year>
          <volume>127</volume>
          <fpage>107310</fpage>
          <pub-id pub-id-type="doi">10.1016/j.engappai.2023.107310</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B3">
        <label>3</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fu</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Zhong</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Graph relationship-driven label coded mapping and compensation for multi-label textile fiber recognition</article-title>
          <source>Eng Appl Artif Intell</source>
          <year>2024</year>
          <volume>133</volume>
          <fpage>108484</fpage>
          <pub-id pub-id-type="doi">10.1016/j.engappai.2024.108484</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B4">
        <label>4</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Gao</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A conditional-weight joint relevance metric for feature relevancy term</article-title>
          <source>Eng Appl Artif Intell</source>
          <year>2021</year>
          <volume>106</volume>
          <fpage>104481</fpage>
          <pub-id pub-id-type="doi">10.1016/j.engappai.2021.104481</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B5">
        <label>5</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Han</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Gao</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Feature relevance and redundancy coefficients for multi-view multi-label feature selection</article-title>
          <source>Inf Sci</source>
          <year>2024</year>
          <volume>652</volume>
          <fpage>119747</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ins.2023.119747</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B6">
        <label>6</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Mu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Wan</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Tao</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Classifier enhancement based on credible sample selection for partial multi-label learning</article-title>
          <source>Appl Intell</source>
          <year>2025</year>
          <volume>55</volume>
          <fpage>1006</fpage>
          <pub-id pub-id-type="doi">10.1007/s10489-025-06769-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B7">
        <label>7</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xie</surname>
              <given-names>MK</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Partial multi-label learning</article-title>
          <source>Proc AAAI Conf Artif Intell</source>
          <year>2018</year>
          <volume>32</volume>
          <pub-id pub-id-type="doi">10.1609/aaai.v32i1.11644</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B8">
        <label>8</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Boutell</surname>
              <given-names>MR</given-names>
            </name>
            <name>
              <surname>Luo</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Shen</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Brown</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Learning multi-label scene classification</article-title>
          <source>Pattern Recogn</source>
          <year>2004</year>
          <volume>37</volume>
          <fpage>1757</fpage>
          <lpage>71</lpage>
          <pub-id pub-id-type="doi">10.1016/j.patcog.2004.03.009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B9">
        <label>9</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>ML</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>ZH</given-names>
            </name>
          </person-group>
          <article-title>ML-KNN: a lazy learning approach to multi-label learning</article-title>
          <source>Pattern Recogn</source>
          <year>2007</year>
          <volume>40</volume>
          <fpage>2038</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.1016/j.patcog.2006.12.019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B10">
        <label>10</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Chen</surname>
              <given-names>YN</given-names>
            </name>
            <name>
              <surname>Lin</surname>
              <given-names>HT</given-names>
            </name>
          </person-group>
          <comment>Feature-aware label space dimension reduction for multi-label classification. 2012. <uri xlink:href="https://proceedings.neurips.cc/paper/2012/file/d4c2e4a3297fe25a71d030b67eb83bfc-Paper.pdf">https://proceedings.neurips.cc/paper/2012/file/d4c2e4a3297fe25a71d030b67eb83bfc-Paper.pdf</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B11">
        <label>11</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Tian</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Label noise correction for crowdsourcing using dynamic resampling</article-title>
          <source>Eng Appl Artif Intell</source>
          <year>2024</year>
          <volume>133</volume>
          <fpage>108439</fpage>
          <pub-id pub-id-type="doi">10.1016/j.engappai.2024.108439</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B12">
        <label>12</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sun</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Xie</surname>
              <given-names>MK</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>A deep model for partial multi-label image classification with curriculum-based disambiguation</article-title>
          <source>Mach Intell Res</source>
          <year>2024</year>
          <volume>21</volume>
          <fpage>801</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1007/s11633-023-1439-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B13">
        <label>13</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sun</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Lang</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Jin</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Partial multi-label learning by low-rank and sparse decomposition</article-title>
          <source>Proc AAAI Conf Artif Intell</source>
          <year>2019</year>
          <volume>33</volume>
          <fpage>5016</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1609/aaai.v33i01.33015016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B14">
        <label>14</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sun</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Lyu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Lang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Global-local label correlation for partial multi-label learning</article-title>
          <source>IEEE Trans Multimedia</source>
          <year>2021</year>
          <volume>24</volume>
          <fpage>581</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1109/TMM.2021.3055959</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B15">
        <label>15</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xie</surname>
              <given-names>MK</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Partial multi-label learning with noisy label identification</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2022</year>
          <volume>44</volume>
          <fpage>3676</fpage>
          <lpage>87</lpage>
          <pub-id pub-id-type="doi">10.1109/TPAMI.2021.3059290</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B16">
        <label>16</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>BQ</given-names>
            </name>
            <name>
              <surname>Jia</surname>
              <given-names>BB</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <article-title>Towards enabling binary decomposition for partial multi-label learning</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2023</year>
          <volume>45</volume>
          <fpage>13203</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1109/TPAMI.2023.3290797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B17">
        <label>17</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Gao</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Multi-label feature selection based on high-order label correlation assumption</article-title>
          <source>Entropy</source>
          <year>2020</year>
          <volume>22</volume>
          <fpage>797</fpage>
          <pub-id pub-id-type="doi">10.3390/e22070797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B18">
        <label>18</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <comment>Robust subspace segmentation by low-rank representation. In <italic>Proceedings of the 27th International Conference on Machine Learning (ICML-10)</italic>. Omnipress: 2010; pp. 663-70.</comment>
          <pub-id pub-id-type="doi">10.5555/3104322.3104407</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B19">
        <label>19</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jiang</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Qi</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Dai</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Robust subspace segmentation via nonconvex low rank representation</article-title>
          <source>Inf Sci</source>
          <year>2016</year>
          <volume>340-1</volume>
          <fpage>144</fpage>
          <lpage>58</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ins.2015.12.038</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B20">
        <label>20</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xiao</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Tan</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Dong</surname>
              <given-names>ZY</given-names>
            </name>
          </person-group>
          <article-title>Robust kernel low-rank representation</article-title>
          <source>IEEE Trans Neural Netw Learn Syst</source>
          <year>2016</year>
          <volume>27</volume>
          <fpage>2268</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1109/TNNLS.2015.2472284</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B21">
        <label>21</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Robust structured subspace learning for data representation</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2015</year>
          <volume>37</volume>
          <fpage>2085</fpage>
          <lpage>98</lpage>
          <pub-id pub-id-type="doi">10.1109/TPAMI.2015.2400461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B22">
        <label>22</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tanfous</surname>
              <given-names>AB</given-names>
            </name>
            <name>
              <surname>Drira</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Amor</surname>
              <given-names>BB</given-names>
            </name>
          </person-group>
          <article-title>Sparse coding of shape trajectories for facial expression and action recognition</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2020</year>
          <volume>42</volume>
          <fpage>2594</fpage>
          <lpage>607</lpage>
          <pub-id pub-id-type="doi">10.1109/TPAMI.2019.2932979</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B23">
        <label>23</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Roweis</surname>
              <given-names>ST</given-names>
            </name>
            <name>
              <surname>Saul</surname>
              <given-names>LK</given-names>
            </name>
          </person-group>
          <article-title>Nonlinear dimensionality reduction by locally linear embedding</article-title>
          <source>Science</source>
          <year>2000</year>
          <volume>290</volume>
          <fpage>2323</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1126/science.290.5500.2323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B24">
        <label>24</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Abdolali</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Gillis</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Beyond linear subspace clustering: a comparative study of nonlinear manifold clustering algorithms</article-title>
          <source>Comput Sci Rev</source>
          <year>2021</year>
          <volume>42</volume>
          <fpage>100435</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cosrev.2021.100435</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B25">
        <label>25</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Fang</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>An adaptive class prototype generation framework for partial label learning</article-title>
          <source>Eng Appl Artif Intell</source>
          <year>2024</year>
          <volume>133</volume>
          <fpage>108178</fpage>
          <pub-id pub-id-type="doi">10.1016/j.engappai.2024.108178</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B26">
        <label>26</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Fan</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Shao</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Song</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Generalized contrastive partial label learning for cross-subject EEG-based emotion recognition</article-title>
          <source>IEEE Trans Instrum Meas</source>
          <year>2024</year>
          <volume>73</volume>
          <fpage>1</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1109/TIM.2024.3398103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B27">
        <label>27</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fan</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Partial label learning with competitive learning graph neural network</article-title>
          <source>Eng Appl Artif Intell</source>
          <year>2022</year>
          <volume>111</volume>
          <fpage>104779</fpage>
          <pub-id pub-id-type="doi">10.1016/j.engappai.2022.104779</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B28">
        <label>28</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Feng</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>An</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <comment>Partial label learning by semantic difference maximization. In <italic>Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence</italic>. 2019; pp. 2294-300.</comment>
          <pub-id pub-id-type="doi">10.24963/ijcai.2019/318</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B29">
        <label>29</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>LP</given-names>
            </name>
            <name>
              <surname>Dietterich</surname>
              <given-names>TG</given-names>
            </name>
          </person-group>
          <comment>A conditional multinomial mixture model for superset label learning. In <italic>Proceedings of the 26th International Conference on Neural Information Processing Systems</italic>. Curran Associates Inc.: 2012; pp. 548-56.</comment>
          <pub-id pub-id-type="doi">10.5555/2999134.2999196</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B30">
        <label>30</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cour</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Sapp</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Taskar</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Learning from partial labels</article-title>
          <source>J Mach Learn Res</source>
          <year>2011</year>
          <volume>12</volume>
          <fpage>1501</fpage>
          <lpage>36</lpage>
		  <comment><uri xlink:href="https://jmlr.csail.mit.edu/papers/v12/cour11a.html">https://jmlr.csail.mit.edu/papers/v12/cour11a.html</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B31">
        <label>31</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gong</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Tao</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A regularization approach for instance-based superset label learning</article-title>
          <source>IEEE Trans Cybern</source>
          <year>2018</year>
          <volume>48</volume>
          <fpage>967</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1109/TCYB.2017.2669639</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B32">
        <label>32</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gong</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yuan</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Bao</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Generalized large margin <italic>k</italic>NN for partial label learning</article-title>
          <source>IEEE Trans Multimedia</source>
          <year>2021</year>
          <volume>24</volume>
          <fpage>1055</fpage>
          <lpage>66</lpage>
          <pub-id pub-id-type="doi">10.1109/TMM.2021.3109438</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B33">
        <label>33</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Sun</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Min</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <comment>PP-PLL: probability propagation for partial label learning. In <italic>Machine Learning and Knowledge Discovery in Databases: European Conference, ECML PKDD 2019</italic>, Würzburg, Germany, September 16-20, 2019; Springer; 2020; pp. 123-37.</comment>
          <pub-id pub-id-type="doi">10.1007/978-3-030-46147-8_8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B34">
        <label>34</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <comment>Partial label learning with discrimination augmentation. In <italic>Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining</italic>. Association for Computing Machinery: 2022; pp. 1920-8.</comment>
          <pub-id pub-id-type="doi">10.1145/3534678.3539363</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B35">
        <label>35</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lyu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Dai</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Partial label learning via low-rank representation and label propagation</article-title>
          <source>Soft Comput</source>
          <year>2020</year>
          <volume>24</volume>
          <fpage>5165</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1007/s00500-019-04269-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B36">
        <label>36</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Xia</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Lyu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Partial label learning with noisy side information</article-title>
          <source>Appl Intell</source>
          <year>2022</year>
          <volume>52</volume>
          <fpage>12382</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="doi">10.1007/s10489-021-03137-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B37">
        <label>37</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gong</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Jing</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Convolutional attention-based contrastive learning for partial label learning</article-title>
          <source>Appl Intell</source>
          <year>2025</year>
          <volume>55</volume>
          <fpage>868</fpage>
          <pub-id pub-id-type="doi">10.1007/s10489-025-06757-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B38">
        <label>38</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Wan</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Vong</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Multi-kernel partial label learning using graph contrast disambiguation</article-title>
          <source>Appl Intell</source>
          <year>2024</year>
          <volume>54</volume>
          <fpage>9760</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1007/s10489-024-05639-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B39">
        <label>39</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>ML</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>CZ</given-names>
            </name>
          </person-group>
          <article-title>Disambiguation-free partial label learning</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2017</year>
          <volume>29</volume>
          <fpage>2155</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.1109/TKDE.2017.2721942</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B40">
        <label>40</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lyu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Lang</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>GM-PLL: Graph matching based partial label learning</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2021</year>
          <volume>33</volume>
          <fpage>521</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1109/TKDE.2019.2933837</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B41">
        <label>41</label>
        <nlm-citation publication-type="web">
          <person-group person-group-type="author">
            <name>
              <surname>Feng</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Lv</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Han</surname>
              <given-names>B</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Provably consistent partial-label learning. <italic>arXiv</italic> <bold>2020</bold>, arXiv:2007.08929. Available online: <uri xlink:href="https://doi.org/10.48550/arXiv.2007.08929">https://doi.org/10.48550/arXiv.2007.08929</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B42">
        <label>42</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>LP</given-names>
            </name>
            <name>
              <surname>Dietterich</surname>
              <given-names>TG</given-names>
            </name>
          </person-group>
          <comment>Learnability of the superset label learning problem. In <italic>International Conference on Machine Learning</italic>. 2014. <uri xlink:href="https://api.semanticscholar.org/CorpusID:17882853">https://api.semanticscholar.org/CorpusID:17882853</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B43">
        <label>43</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Xu</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Lv</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Qiao</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Geng</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <comment>Progressive purification for instance-dependent partial label learning. In <italic>Proceedings of the 40th International Conference on Machine Learning</italic>. PMLR: 2023; pp. 38551-65. <uri xlink:href="https://proceedings.mlr.press/v202/xu23l.html">https://proceedings.mlr.press/v202/xu23l.html</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B44">
        <label>44</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>ML</given-names>
            </name>
            <name>
              <surname>Fang</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>Partial multi-label learning via credible label elicitation</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2021</year>
          <volume>43</volume>
          <fpage>3587</fpage>
          <lpage>99</lpage>
          <pub-id pub-id-type="doi">10.1109/TPAMI.2020.2985210</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B45">
        <label>45</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <comment>Discriminative and correlative partial multi-label learning. In <italic>Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence</italic>. 2019; pp. 3691-7.</comment>
          <pub-id pub-id-type="doi">10.24963/ijcai.2019/512</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B46">
        <label>46</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Domeniconi</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <comment>Feature-induced partial multi-label learning. In <italic>2018 IEEE international conference on data mining (ICDM)</italic>, Singapore, Nov 17-20, 2018. IEEE; 2018. pp. 1398-403.</comment>
          <pub-id pub-id-type="doi">10.1109/ICDM.2018.00192</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B47">
        <label>47</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Gong</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Yuan</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Bao</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <comment>Understanding partial multi-label learning via mutual information. In <italic>35th Conference on Neural Information Processing Systems (NeurIPS 2021)</italic>. 2021; pp. 4147-56. <uri xlink:href="https://proceedings.neurips.cc/paper/2021/file/217c0e01c1828e7279051f1b6675745d-Paper.pdf">https://proceedings.neurips.cc/paper/2021/file/217c0e01c1828e7279051f1b6675745d-Paper.pdf</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B48">
        <label>48</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wu</surname>
              <given-names>JH</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>QG</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <comment>Feature-induced manifold disambiguation for multi-view partial multi-label learning. In <italic>Proceedings of the 26th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining</italic>. Association for Computing Machinery: 2020; pp. 557-65.</comment>
          <pub-id pub-id-type="doi">10.1145/3394486.3403098</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B49">
        <label>49</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hao</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Gao</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Partial multi-label feature selection via subspace optimization</article-title>
          <source>Inf Sci</source>
          <year>2023</year>
          <volume>648</volume>
          <fpage>119556</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ins.2023.119556</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B50">
        <label>50</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Hang</surname>
              <given-names>JY</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <comment>Partial multi-label learning with probabilistic graphical disambiguation. In <italic>37th Conference on Neural Information Processing Systems (NeurIPS 2023)</italic>. 2023; pp. 1339-51. <uri xlink:href="https://proceedings.neurips.cc/paper_files/paper/2023/file/04e05ba5cbc36044f6499d1edf15247e-Paper-Conference.pdf">https://proceedings.neurips.cc/paper_files/paper/2023/file/04e05ba5cbc36044f6499d1edf15247e-Paper-Conference.pdf</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B51">
        <label>51</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Han</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Wan</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>PML-ED: a method of partial multi-label learning by using encoder-decoder framework and exploring label correlation</article-title>
          <source>Inf Sci</source>
          <year>2024</year>
          <volume>661</volume>
          <fpage>120165</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ins.2024.120165</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B52">
        <label>52</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Gu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Bu</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Qi</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Fan</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Partial multi-label learning via K-means graph transformer</article-title>
          <source>Knowl Based Syst</source>
          <year>2025</year>
          <volume>325</volume>
          <fpage>114017</fpage>
          <pub-id pub-id-type="doi">10.1016/j.knosys.2025.114017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B53">
        <label>53</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Qi</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Nonlinear characteristic-driven partial multi-label learning. In <italic>Advances in Knowledge Discovery and Data Mining</italic>. Springer Nature Singapore: 2026; pp. 442-54.</comment>
          <pub-id pub-id-type="doi">10.1007/978-981-92-1300-9_35</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B54">
        <label>54</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Ma</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Win</surname>
              <given-names>KT</given-names>
            </name>
            <name>
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Low-rank and sparse representation based learning for cancer survivability prediction</article-title>
          <source>Inf Sci</source>
          <year>2022</year>
          <volume>582</volume>
          <fpage>573</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ins.2021.10.013</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B55">
        <label>55</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fan</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Addressing label ambiguity imbalance in candidate labels: measures and disambiguation algorithm</article-title>
          <source>Inf Sci</source>
          <year>2022</year>
          <volume>612</volume>
          <fpage>1</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ins.2022.07.175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B56">
        <label>56</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Gao</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Feature relevance term variation for multi-label feature selection</article-title>
          <source>Appl Intell</source>
          <year>2021</year>
          <volume>51</volume>
          <fpage>5095</fpage>
          <lpage>110</lpage>
          <pub-id pub-id-type="doi">10.1007/s10489-020-02129-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B57">
        <label>57</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gao</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Feature redundancy based on interaction information for multi-label feature selection</article-title>
          <source>IEEE Access</source>
          <year>2020</year>
          <volume>8</volume>
          <fpage>146050</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.1109/ACCESS.2020.3015755</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B58">
        <label>58</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Auricchio</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Brigati</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Giudici</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Toscani</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Multivariate Gini-type discrepancies</article-title>
          <source>Math Models Methods Appl Sci</source>
          <year>2025</year>
          <volume>35</volume>
          <fpage>1267</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="doi">10.1142/S0218202525500174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B59">
        <label>59</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Su</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <comment>Linearized alternating direction method with adaptive penalty for low-rank representation. In <italic>Proceedings of the 25th International Conference on Neural Information Processing Systems</italic>. Curran Associates Inc.: 2011; pp. 612-20.</comment>
          <pub-id pub-id-type="doi">10.5555/2986459.2986528</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B60">
        <label>60</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Huiskes</surname>
              <given-names>MJ</given-names>
            </name>
            <name>
              <surname>Lew</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <comment>The MIR flickr retrieval evaluation. In <italic>Proceedings of the 1st ACM International Conference on Multimedia Information Retrieval</italic>. Association for Computing Machinery: 2008; pp. 39-43.</comment>
          <pub-id pub-id-type="doi">10.1145/1460096.1460104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B61">
        <label>61</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Katakis</surname>
              <given-names>I</given-names>
            </name>
            <name>
              <surname>Tsoumakas</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Vlahavas</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <comment>Multilabel text classification for automated tag suggestion. 2008. <uri xlink:href="https://api.semanticscholar.org/CorpusID:15676013">https://api.semanticscholar.org/CorpusID:15676013</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B62">
        <label>62</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Briggs</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Raich</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <comment>The 9th annual MLSP competition: new methods for acoustic classification of multiple simultaneous bird species in a noisy environment. In <italic>2013 IEEE international workshop on machine learning for signal processing (MLSP)</italic>, Southampton, UK, Sep 22-25, 2013. IEEE; 2013. p. 1-8.</comment>
          <pub-id pub-id-type="doi">10.1109/MLSP.2013.6661934</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B63">
        <label>63</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Trohidis</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Tsoumakas</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Kalliris</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Vlahavas</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <comment>Multi-label classification of music into emotions. 2008; pp. 325-30. <uri xlink:href="https://www.researchgate.net/publication/288623967_Multilabel_classification_of_music_into_emotions">https://www.researchgate.net/publication/288623967_Multilabel_classification_of_music_into_emotions</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B64">
        <label>64</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Pestian</surname>
              <given-names>JP</given-names>
            </name>
            <name>
              <surname>Brew</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Matykiewicz</surname>
              <given-names>P</given-names>
            </name>
            <etal />
          </person-group>
          <comment>A shared task involving multi-label classification of clinical free text. In <italic>Biological, translational, and clinical language processing</italic>, Prague, Czech Republic, 2007. Association for Computational Linguistics: 2007; pp. 97-104. <uri xlink:href="https://aclanthology.org/W07-1013/">https://aclanthology.org/W07-1013/</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B65">
        <label>65</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lyu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Noisy label tolerance: a new perspective of partial multi-label learning</article-title>
          <source>Inf Sci</source>
          <year>2021</year>
          <volume>543</volume>
          <fpage>454</fpage>
          <lpage>66</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ins.2020.09.019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B66">
        <label>66</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Lyu</surname>
              <given-names>G</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Deep partial multi-label learning with graph disambiguation. <italic>arXiv</italic> <bold>2023</bold>, arXiv:2305.05882. Available online: <uri xlink:href="https://doi.org/10.48550/arXiv.2305.05882">https://doi.org/10.48550/arXiv.2305.05882</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
      <ref id="B67">
        <label>67</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fan</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Partial multi-label learning via transformer to discover discriminative label embeddings</article-title>
          <source>Neurocomputing</source>
          <year>2026</year>
          <volume>684</volume>
          <fpage>133518</fpage>
          <pub-id pub-id-type="doi">10.1016/j.neucom.2026.133518</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B68">
        <label>68</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Demšar</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Statistical comparisons of classifiers over multiple data sets</article-title>
          <source>J Mach Learn Res</source>
          <year>2006</year>
          <volume>7</volume>
          <fpage>1</fpage>
          <lpage>30</lpage>
		  <comment><uri xlink:href="https://www.jmlr.org/papers/volume7/demsar06a/demsar06a.pdf">https://www.jmlr.org/papers/volume7/demsar06a/demsar06a.pdf</uri>. (accessed 2026-06-26)</comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>