﻿<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.0 20120330//EN" "http://jats.nlm.nih.gov/publishing/1.0/JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="nlm-ta">J. Mater. Inf.</journal-id>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-title-group>
        <journal-title>Journal of Materials Informatics</journal-title>
      </journal-title-group>
      <issn pub-type="epub">2770-372X</issn>
      <publisher>
        <publisher-name>OAE Publishing Inc.</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.20517/jmi.2026.02</article-id>
      <article-categories>
        <subj-group>
          <subject>Research Article</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Intelligent visualization-driven materials design via two-dimensional symbolic feature generation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <name>
            <surname>Yong</surname>
            <given-names>Wei</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="aff" rid="I#">
            <sup>#</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <name>
            <surname>Zhang</surname>
            <given-names>Hongtao</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="aff" rid="I2">
            <sup>2</sup>
          </xref>
          <xref ref-type="aff" rid="I3">
            <sup>3</sup>
          </xref>
          <xref ref-type="aff" rid="I4">
            <sup>4</sup>
          </xref>
          <xref ref-type="aff" rid="I#">
            <sup>#</sup>
          </xref>
          <xref ref-type="aff" rid="I*">
            <sup>*</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1" />
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Li</surname>
            <given-names>Zhuang</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>He</surname>
            <given-names>Jie</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Chen</surname>
            <given-names>Chubo</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Gao</surname>
            <given-names>Yaxin</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <name>
            <surname>Fu</surname>
            <given-names>Huadong</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="aff" rid="I2">
            <sup>2</sup>
          </xref>
          <xref ref-type="aff" rid="I3">
            <sup>3</sup>
          </xref>
          <xref ref-type="aff" rid="I4">
            <sup>4</sup>
          </xref>
          <xref ref-type="aff" rid="I5">
            <sup>5</sup>
          </xref>
          <xref ref-type="aff" rid="I*">
            <sup>*</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1" />
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Xie</surname>
            <given-names>Jianxin</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="aff" rid="I2">
            <sup>2</sup>
          </xref>
          <xref ref-type="aff" rid="I3">
            <sup>3</sup>
          </xref>
          <xref ref-type="aff" rid="I4">
            <sup>4</sup>
          </xref>
          <xref ref-type="aff" rid="I5">
            <sup>5</sup>
          </xref>
        </contrib>
      </contrib-group>
      <aff id="I1">
        <sup>1</sup>Beijing Advanced Innovation Center for Materials Genome Engineering, School of Advanced Materials Innovation, University of Science and Technology Beijing, Beijing 100083, China.</aff>
      <aff id="I2">
        <sup>2</sup>Beijing Key Laboratory of Materials Intelligent Technology, School of Advanced Materials Innovation, University of Science and Technology Beijing, Beijing 100083, China.</aff>
      <aff id="I3">
        <sup>3</sup>Beijing Laboratory of Metallic Materials and Processing for Modern Transportation, School of Advanced Materials Innovation, University of Science and Technology Beijing, Beijing 100083, China.</aff>
      <aff id="I4">
        <sup>4</sup>Key Laboratory for Advanced Materials Processing (MOE), School of Advanced Materials Innovation, University of Science and Technology Beijing, Beijing 100083, China.</aff>
      <aff id="I5">
        <sup>5</sup>Institute of Materials Intelligent Technology, Liaoning Academy of Materials, Shenyang 110004, Liaoning, China.</aff>
      <aff id="I#">
        <sup>#</sup>Authors contributed equally to this work.</aff>
      <author-notes>
        <corresp id="cor1"><sup>*</sup>Correspondence to: Prof. Hongtao Zhang, Prof. Huadong Fu, Beijing Advanced Innovation Center for Materials Genome Engineering, School of Advanced Materials Innovation, University of Science and Technology Beijing, Beijing 100083, China. E-mail: <email>zht@ustb.edu.cn</email>; <email>hdfu@ustb.edu.cn</email></corresp>
        <fn fn-type="other">
          <p>
            <bold>Received:</bold> 27 Jan 2026 | <bold>First Decision:</bold> 13 Feb 2026 | <bold>Revised:</bold> 11 Mar 2026 | <bold>Accepted:</bold> 26 Mar 2026 | <bold>Published:</bold> 25 Jun 2026</p>
        </fn>
        <fn fn-type="other">
          <p>
            <bold>Academic Editor:</bold> Sergei Manzhos | <bold>Copy Editor:</bold> Pei-Yun Wang | <bold>Production Editor:</bold> Pei-Yun Wang</p>
        </fn>
      </author-notes>
      <pub-date pub-type="ppub">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>25</day>
        <month>6</month>
        <year>2026</year>
      </pub-date>
      <volume>6</volume>
	  <issue>2</issue>
      <elocation-id>34</elocation-id>
      <permissions>
        <copyright-statement>© The Author(s) 2026.</copyright-statement>
        <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>© The Author(s) 2026. <bold>Open Access</bold> This article is licensed under a Creative Commons Attribution 4.0 International License (<uri xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</uri>), which permits unrestricted use, sharing, adaptation, distribution and reproduction in any medium or format, for any purpose, even commercially, as long as you give appropriate credit to the original author(s) and the source, provide a link to the Creative Commons license, and indicate if changes were made.</license-p>
        </license>
      </permissions>
      <abstract>
        <p>Machine learning (ML) for complex materials problems suffers from high-dimensional data, while traditional “black-box” dimensionality reduction techniques generally fail to balance predictive accuracy with visualization and interpretability. This work presents a novel method, named two-dimensional symbolic feature generation (2D-SFG), based on symbolic regression and genetic algorithms. This approach facilitates ML by providing quantifiable interpretability and enabling visualization-driven materials design. Evaluated across diverse classification and regression tasks in materials science, the proposed method demonstrates notable success in three critical aspects. First, it significantly improves predictive accuracy. Specifically, the classification accuracies for ferroelectric perovskites and high-entropy alloy (HEA) phases improved from 85.6% and 84.5% to 94.2% and 88.4%, respectively. Correspondingly, the prediction errors for shape memory alloys and copper alloys were reduced from 2.9 K, 5.9%, and 9.7% to 1.1 K, 3.7%, and 6.2%, respectively. Second, the method ensures interpretability by constructing explicit mathematical expressions that transform the original high-dimensional features into two new symbolic ones, avoiding opaque spatial transformations. Third, it enables model visualization through two-dimensional (2D) contour maps that relate the constructed features to the target properties, thereby offering intuitive insights into feature–property relationships. Leveraging these “design roadmaps”, a refractory HEA with a single-phase solid solution and a precipitation-strengthened copper alloy with an optimized property trade-off were successfully designed. The 2D symbolic feature generation framework thus addresses key limitations in accuracy, interpretability, and visualization within materials informatics, establishing a new paradigm for transparent and visual materials design.</p>
      </abstract>
      <kwd-group>
        <kwd>Machine learning</kwd>
        <kwd>feature construction</kwd>
        <kwd>interpretability</kwd>
        <kwd>visualization-driven materials design</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec id="sec1">
      <title>INTRODUCTION</title>
      <p>In recent years, progress in artificial intelligence has empowered machine learning (ML) to achieve notable successes in materials development<sup>[<xref ref-type="bibr" rid="B1">1</xref>-<xref ref-type="bibr" rid="B6">6</xref>]</sup>. ML techniques have been effectively employed in composition design, process optimization, and property prediction across a variety of material systems, such as copper alloys<sup>[<xref ref-type="bibr" rid="B7">7</xref>-<xref ref-type="bibr" rid="B11">11</xref>]</sup>, high-entropy alloys (HEAs)<sup>[<xref ref-type="bibr" rid="B12">12</xref>-<xref ref-type="bibr" rid="B16">16</xref>]</sup>, superalloys<sup>[<xref ref-type="bibr" rid="B17">17</xref>-<xref ref-type="bibr" rid="B21">21</xref>]</sup>, steels<sup>[<xref ref-type="bibr" rid="B22">22</xref>-<xref ref-type="bibr" rid="B25">25</xref>]</sup>, and ferroelectric materials<sup>[<xref ref-type="bibr" rid="B26">26</xref>-<xref ref-type="bibr" rid="B30">30</xref>]</sup>, thereby pioneering a new paradigm for accelerated materials research and development.</p>
      <p>However, the pursuit of higher predictive accuracy in materials informatics is paradoxically leading to increasingly complex and large-scale models. Representative approaches, such as large language models<sup>[<xref ref-type="bibr" rid="B31">31</xref>-<xref ref-type="bibr" rid="B34">34</xref>]</sup> and deep reinforcement learning<sup>[<xref ref-type="bibr" rid="B6">6</xref>,<xref ref-type="bibr" rid="B21">21</xref>,<xref ref-type="bibr" rid="B35">35</xref>-<xref ref-type="bibr" rid="B37">37</xref>]</sup>, excel in composition design and property prediction. However, their massive parameters and multi-layer nonlinear transformations render them inherently uninterpretable “black boxes”. Consequently, these models operate via end-to-end input–output mappings without offering navigable guidance for materials design, effectively forcing blind exploration in high-dimensional spaces and thereby limiting both interpretability and the extraction of reusable design routes.</p>
      <p>To address the interpretability issues of complex models, mainstream analytical methods such as SHapley Additive exPlanations (SHAP)<sup>[<xref ref-type="bibr" rid="B38">38</xref>]</sup> and Local Interpretable Model-agnostic Explanations (LIME)<sup>[<xref ref-type="bibr" rid="B39">39</xref>]</sup> are commonly employed to evaluate feature importance. Alibagheri <italic>et al.</italic> developed a predictive model connecting electronic structure features to formation energy and subsequently applied SHAP analysis to rank feature contributions, revealing a negative correlation between average ionic charge and formation energy<sup>[<xref ref-type="bibr" rid="B40">40</xref>]</sup>. Similarly, Xu <italic>et al.</italic> employed SHAP to evaluate the influence of elemental composition and heat treatment parameters on the γ′ depletion zone thickness, providing valuable insights into thermal barrier coating bond coat design<sup>[<xref ref-type="bibr" rid="B41">41</xref>]</sup>. However, such post hoc interpretation techniques only yield qualitative rankings that lack physical grounding. They fail to establish quantitative mappings between physicochemical features and material properties, thus falling short of offering deep physical interpretability.</p>
      <p>To extract and reuse design pathways from complex models, projection-based dimensionality reduction techniques are commonly applied to visualize feature–property relationships in two-dimensional (2D) space. Chen <italic>et al.</italic> used principal component analysis (PCA)<sup>[<xref ref-type="bibr" rid="B43">43</xref>]</sup> to project multiple variables into a 2D space, successfully visualizing the stability boundary of the solid-solution phase in a five-component HEA system<sup>[<xref ref-type="bibr" rid="B42">42</xref>]</sup>. Their analysis identified melting point and mixing enthalpy as the primary factors determining phase stability. Srinivasan <italic>et al.</italic> employed the Isomap algorithm<sup>[<xref ref-type="bibr" rid="B45">45</xref>]</sup> to map high-dimensional descriptors of the Co<sub>3</sub>(Al, X) system into a low-dimensional space, generating a 2D point-line graph where elements were represented as nodes and descriptor similarities as edges<sup>[<xref ref-type="bibr" rid="B44">44</xref>]</sup>. This approach enabled the intuitive identification of candidate compositions with high binding energy, high melting point, and coherence with the Co-rich face-centered cubic matrix. Tian <italic>et al.</italic> applied uniform manifold approximation and projection (UMAP)<sup>[<xref ref-type="bibr" rid="B46">46</xref>]</sup> to reduce the 768-dimensional vectors from the steel-specialized large language model (SteelBERT) into a 2D space while preserving local topological structures<sup>[<xref ref-type="bibr" rid="B32">32</xref>]</sup>. The resulting “knowledge map of steel” was distinguished by keywords such as fatigue, irradiation, and welding, which intuitively revealed latent research hotspots and trends within the literature. These methods share the common objective of mapping high-dimensional data into a 2D space to generate clear and intuitive visualizations that facilitate the analysis and structural understanding of complex data. However, the relationships between the reduced-dimensional features and the original features remain obscure, making it impossible to analyze how dimensionality reduction influences feature representation and material properties.</p>
      <p>In summary, current approaches still exhibit significant limitations in providing model interpretability and the visualization of materials design. Previous studies have shown that algorithms such as symbolic regression and linear regression can establish explicit mathematical expressions linking material features to properties, presenting a viable path to overcome these shortcomings. Zhao <italic>et al.</italic> employed symbolic regression to establish an explicit mathematical expression linking alloy composition and thermal conditions to high-temperature specific yield strength, providing a closed-loop framework for the inverse design of refractory HEAs<sup>[<xref ref-type="bibr" rid="B47">47</xref>]</sup>. Xue <italic>et al.</italic> successfully developed a simple and interpretable polynomial regression expression relating the phase transformation temperature of NiTi-based shape memory alloys to crystal structure parameters<sup>[<xref ref-type="bibr" rid="B48">48</xref>]</sup>. Such approaches extract compact and physically informative expressions from materials data to guide design. However, their predictive accuracy is limited due to the oversimplification inherent in representing material behavior with only a small set of features.</p>
      <p>To address these challenges, this work proposes a novel two-dimensional symbolic feature generation (2D-SFG) method via genetic programming-based symbolic regression, enabling visual and interpretable materials design. By combining original features with mathematical operators, 2D-SFG constructs explicit mathematical expressions as new features, which are then used to generate 2D classification probability maps or property contour plots. This framework supports efficient and intuitive materials design. When applied to various classification and regression tasks, the proposed method simultaneously improves predictive accuracy, enhances interpretability, and enables design visualization, thereby establishing a new strategy for interpretable and visual materials design.</p>
    </sec>
    <sec id="sec2">
      <title>MATERIALS AND METHODS</title>
      <p>This work introduces a novel feature construction methodology designed to simultaneously enhance the predictive performance of ML models and provide explicit, interpretable feature representations. Mathematically, for a given ML problem formulated as <bold>target = <italic>f</italic> (<italic>x</italic><sub>1</sub>, <italic>x</italic><sub>2</sub>, …, <italic>x</italic><sub>n</sub>)</bold>, two new features are generated through symbolic regression: <bold><italic>X</italic><sub>1</sub> = <italic>F</italic><sub>1</sub> (<italic>x</italic><sub>1</sub>, <italic>x</italic><sub>2</sub>, …, <italic>x</italic><sub>n</sub>)</bold> and <bold><italic>X</italic><sub>2</sub> = <italic>F</italic><sub>2</sub> (<italic>x</italic><sub>1</sub>, <italic>x</italic><sub>2</sub>, …, <italic>x</italic><sub>n</sub>)</bold>. This transforms the original modeling task into <bold>target = <italic>g</italic> (<italic>X</italic><sub>1</sub>, <italic>X</italic><sub>2</sub>)</bold>, with the key constraint that the model based on these constructed features achieves superior accuracy or lower error compared to the initial model. Notably, <bold><italic>F</italic><sub>1</sub></bold> and <bold><italic>F</italic><sub>2</sub></bold> represent explicit mathematical relationships rather than uninterpretable black-box models. The overall workflow is illustrated in <xref ref-type="fig" rid="fig1">Figure 1</xref>.</p>
      <fig id="fig1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>2D-SFG method. A novel feature construction strategy combining symbolic regression and genetic algorithms for 2D symbolic features. 2D-SFG: Two-dimensional symbolic feature generation; 2D: two-dimensional.</p>
        </caption>
        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6002.fig.1.jpg" />
      </fig>
      <p>First, features relevant to the modeling problem, such as composition, processing conditions, microstructure, and empirical knowledge, were collected to form an initial feature set. It is noteworthy that this set may comprise either raw, unscreened features or a pre-selected subset of key attributes identified in earlier research. Symbolic regression was then applied to construct new features in the form of explicit mathematical expression trees derived from the original features. This construction process constitutes the core of the proposed methodology, aiming to synthesize critical information from the initial feature set through interpretable mathematical expressions while eliminating redundancy and irrelevant details.</p>
      <p>However, since feature construction typically explores an expansive combinatorial space, an exhaustive search over all possible expressions is computationally infeasible. Therefore, an evolutionary optimization approach was introduced to address this issue. Newly constructed features were paired to form a “feature-pair set”, with the population size set to 500. Each feature pair served as the input for model training, and the resulting model was evaluated based on a fitness metric (e.g., accuracy or error) to retain high-performing feature pairs. Subsequently, crossover and mutation operations were applied to generate new feature-pair sets over 100 generations, progressively improving feature quality and model performance. In the Genetic Algorithm, Accuracy served as the fitness function for classification tasks, while mean absolute percentage error or root mean square error (RMSE) was employed for regression tasks. Concurrently, a hard constraint limiting the maximum number of nodes to fewer than 17 was imposed to balance model accuracy and formula interpretability. The pseudocode of the proposed 2D-SFG method is summarized in <xref ref-type="table" rid="t1">Table 1</xref>.</p>
      <table-wrap id="t1">
        <label>Table 1</label>
        <caption>
          <p>Pseudocode of the 2D-SFG method</p>
        </caption>
        <table frame="hsides" rules="groups">
          <thead>
            <tr>
              <td style="border-bottom:1;">
                <bold>Step</bold>
              </td>
              <td style="border-bottom:1;">
                <bold>Methods</bold>
              </td>
            </tr>
          </thead>
          <tbody>
            <tr>
              <td>
                <bold>1</bold>
              </td>
              <td>Let <inline-formula><tex-math id="M1">$$ \boldsymbol{\mathcal{D}_o} $$</tex-math></inline-formula><bold>: = {+, -, ×, ÷, …}</bold> and <inline-formula><tex-math id="M1">$$ \boldsymbol{\mathcal{D}_f} $$</tex-math></inline-formula><bold>: = {<italic>x</italic><sub>1</sub>, <italic>x</italic><sub>2</sub>, …, <italic>x</italic><italic><sub>n</sub></italic>}</bold> represent the operator symbol set and feature set, respectively.</td>
            </tr>
            <tr>
              <td>
                <bold>2</bold>
              </td>
              <td>Generate <bold><italic>N</italic></bold> formula trees <bold>{<italic>X</italic>}</bold> with elements randomly selected from the two sets in <bold>Step 1</bold>, e.g., <bold><italic>X</italic> = <italic>x</italic><italic><sub>i</sub></italic><italic>x</italic><italic><sub>k</sub></italic> - <italic>x</italic><italic><sub>j</sub></italic>, <italic>x</italic><italic><sub>i</sub></italic>/<italic>x</italic><italic><sub>j</sub></italic>, …</bold></td>
            </tr>
            <tr>
              <td>
                <bold>3</bold>
              </td>
              <td>A set of feature pairs, denoted as <inline-formula><tex-math id="M1">$$ \boldsymbol{\mathcal{D}_p} $$</tex-math></inline-formula>, was generated by sampling 2N times from {X} with replacement, i.e., <inline-formula><tex-math id="M1">$$ \boldsymbol{\mathcal{D}_p} $$</tex-math></inline-formula><bold> = {(<italic>X</italic><sub>1</sub><italic>, X</italic><sub>2</sub>), (<italic>X</italic><sub>3</sub>, <italic>X</italic><sub>4</sub>), (<italic>X</italic><sub>1</sub>, <italic>X</italic><sub>3</sub>), …}</bold>, in which <bold><italic>X</italic></bold> represents the formula tree in <bold>Step 2</bold>.</td>
            </tr>
            <tr>
              <td>
                <bold>4</bold>
              </td>
              <td>For each pair in <inline-formula><tex-math id="M1">$$ \boldsymbol{\mathcal{D}_p} $$</tex-math></inline-formula>, build a model with the two features as inputs and evaluate the model.</td>
            </tr>
            <tr>
              <td rowspan="2">
                <bold>5</bold>
              </td>
              <td>
                <bold>
                  <italic>If</italic>
                </bold> the stopping condition is <bold>not</bold> met:<break />Update the formula trees by genetic algorithm operations (<bold><italic>Selection</italic>, <italic>Crossover</italic>, <italic>Mutation</italic></bold>).<break />Repeat from <bold>Step 4</bold>.</td>
            </tr>
            <tr>
              <td>
                <bold>
                  <italic>Otherwise</italic>
                </bold>:<break />Return the optimal feature pair.</td>
            </tr>
            <tr>
              <td>
                <bold>End</bold>
              </td>
              <td />
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn>
            <p>2D-SFG: Two-dimensional symbolic feature generation.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>To mitigate symbolic overfitting and expression bloat, the following control mechanisms were implemented:</p>
      <p>• Operator &amp; Constant Restrictions: The search space was limited to the basic arithmetic operators {+, -, ×, /} and a fixed set of constants {0, 1, 2}. This avoids the complexity of optimizing floating-point coefficients and ensures analytical simplicity.<break/>• Structural Hard Constraints: A strict maximum limit of 17 nodes per symbolic tree was enforced. Any genetic operation violating this constraint was rejected.<break/>• No Explicit Penalties or Pruning: Unlike methods using description length penalties, the present approach relies on hard constraints to naturally limit complexity. Additionally, redundant sub-expressions (e.g., x+0) were simplified during generation, eliminating the need for post hoc pruning.<break/>• Numerical Stability: Protected division was employed to handle near-zero denominators, preventing numerical errors during fitness evaluation.<break/>• Dimensional Flexibility: No strict dimensional consistency was enforced, allowing the discovery of empirical dimensionless groups common in materials science.<break/>• Independent Test Set: A completely independent test set was established. The discrepancy in predictive performance between the training and test sets was utilized to evaluate the risk of overfitting.</p>
    </sec>
    <sec id="sec3">
      <title>RESULTS AND DISCUSSION</title>
      <sec id="sec3-1">
        <title>Material visualization classification model</title>
        <p>Feature dimensionality reduction techniques are commonly employed to map high-dimensional data into a lower-dimensional space for more intuitive visualization of sample distributions across classes in classification tasks, such as PCA. These methods primarily retain directions of maximum variance to highlight inter-class differences. However, high variance does not necessarily correspond to discriminative or physically meaningful information. For instance, noise may exhibit greater variance than critical target features. In such cases, reducing the input dimensionality can lead to the loss of important information, thereby damaging the classification performance of the model<sup>[<xref ref-type="bibr" rid="B49">49</xref>]</sup>. The proposed 2D-SFG method not only reduces the input dimensionality by constructing new features but also incorporates nonlinear combinations among features, thereby effectively preserving critical information from the original data while enhancing model visualization and improving predictive accuracy. To evaluate its effectiveness, we compared its performance with existing results in perovskite structural categorization and HEA phase classification, as reported in high-impact journals including <italic>Nature Communications</italic> and <italic>Acta Materialia</italic>.</p>
        <p>Balachandran <italic>et al.</italic> developed a support vector machine-based binary classification model using a dataset of 167 perovskite structures and five input features, achieving an average accuracy of 85.6%<sup>[<xref ref-type="bibr" rid="B30">30</xref>]</sup>. Based on HEA data gathered from references<sup>[<xref ref-type="bibr" rid="B50">50</xref>-<xref ref-type="bibr" rid="B52">52</xref>]</sup>, a phase classification model was built using ten influential features selected via a feature screening method, resulting in a prediction accuracy of 84.5%. The material features employed in the two classification tasks are presented in <xref ref-type="table" rid="t2">Table 2</xref>. Comprehensive details can be found in the <inline-supplementary-material content-type="local-data" mimetype="application/pdf" xlink:href="jmi6002-SupplementaryMaterials.pdf">Supplementary Materials</inline-supplementary-material>.</p>
        <table-wrap id="t2">
          <label>Table 2</label>
          <caption>
            <p>Features used in classification tasks</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Task</bold>
                </td>
                <td colspan="2" style="border-bottom:1;">
                  <bold>Features</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td rowspan="3">Perovskites</td>
                <td>
                  <bold>
                    <italic>f</italic>
                    <sub>0</sub>
                  </bold>: Tolerance factor</td>
                <td>
                  <bold>
                    <italic>f</italic>
                    <sub>1</sub>
                  </bold>: Valence electron number</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>f</italic>
                    <sub>2</sub>
                  </bold>: Martynov-Batsanov electronegativity</td>
                <td>
                  <bold>
                    <italic>f</italic>
                    <sub>3</sub>
                  </bold>: Ideal bond length</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>f</italic>
                    <sub>4</sub>
                  </bold>: Mendeleev number</td>
                <td />
              </tr>
              <tr>
                <td rowspan="5">HEAs</td>
                <td>
                  <bold>Δ<italic>H</italic><italic><sub>mix</sub></italic></bold>: Mixing enthalpy</td>
                <td>
                  <bold>
                    <italic>Xc</italic>
                  </bold>: Chemical bond mismatch</td>
              </tr>
              <tr>
                <td><inline-formula><tex-math id="M1">$$ \overline{MAC} $$</tex-math></inline-formula>: Mean mass attenuation coefficient</td>
                <td><inline-formula><tex-math id="M1">$$ \overline{EA} $$</tex-math></inline-formula>: Mean electron affinity</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>δCE</italic>
                  </bold>: Cohesive energy deviation</td>
                <td><inline-formula><tex-math id="M1">$$ \overline{RM} $$</tex-math></inline-formula>: Mean rigidity modulus</td>
              </tr>
              <tr>
                <td><inline-formula><tex-math id="M1">$$ \overline{MN} $$</tex-math></inline-formula>: Mean Mendeleev number</td>
                <td>
                  <bold>
                    <italic>δMR</italic>
                  </bold>: Metal radius deviation</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>δAV</italic>
                  </bold>: Atomic volume deviation</td>
                <td><inline-formula><tex-math id="M1">$$ \overline{LC} $$</tex-math></inline-formula>: Mean lattice constants <italic>a</italic></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>HEAs: High-entropy alloys.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>
          <xref ref-type="fig" rid="fig2">Figure 2A</xref> and <xref ref-type="fig" rid="fig2">B</xref> illustrate the iterative feature generation process for the two classification cases. As the iterations proceed, the model accuracy gradually increases until it converges to a stable value. This trend indicates that the two new features generated by the 2D-SFG method incorporate more meaningful information to improve model performance. The explicit mathematical relationships of the evolved features after 100 iterations are shown in Equations (1) to (4).</p>
        <fig id="fig2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Application of the 2D-SFG method to classification tasks. (A and B) Iterative feature generation process; the red curve indicates the variation in optimal performance within the population; (C and D) Classification probability maps; the red arrows indicate the direction of increasing probability for the target property. 2D-SFG: Two-dimensional symbolic feature generation.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6002.fig.2.jpg" />
		  </fig>
      <p><bold>Perovskites:</bold></p>
	  <p><disp-formula> <label>(1)</label> <tex-math id="E1"> $$  \boldsymbol{X_{c1}=f_3-f_3^2-f_2\times\frac{f_3}{f_1}} $$ </tex-math></disp-formula></p>
	  <p><disp-formula> <label>(2)</label> <tex-math id="E1"> $$  \boldsymbol{X_{c2}=f_4-f_2} $$ </tex-math></disp-formula></p>
      <p><bold>HEAs:</bold></p>
	  <p><disp-formula> <label>(3)</label> <tex-math id="E1"> $$  \boldsymbol{X_{c3}=\delta MR\times \delta AV\times \left ( 2\times \overline{MAC}\times\frac{\overline{EA}}{\overline{LC}}+\overline{RM}+\delta AV \right ) } $$ </tex-math></disp-formula></p>
	  <p><disp-formula> <label>(4)</label> <tex-math id="E1"> $$  \boldsymbol{X_{c4}=\overline{MN}-Xc+\frac{\delta AV}{\delta CE}+\frac{\overline{MN}}{\overline{EA}}} $$ </tex-math></disp-formula></p>
        <p>where <bold><italic>X<sub>C</sub></italic><sub>1</sub></bold>, <bold><italic>X<sub>C</sub></italic><sub>2</sub></bold>, <bold><italic>X<sub>C</sub></italic><sub>3</sub></bold>, and <bold><italic>X<sub>C</sub></italic><sub>4</sub></bold> denote the constructed symbolic features. Definitions of all other parameters are provided in <xref ref-type="table" rid="t2">Table 2</xref>.</p>
        <p>A support vector classifier was established using the constructed features, and the corresponding classification probability maps are shown in <xref ref-type="fig" rid="fig2">Figure 2C</xref> and <xref ref-type="fig" rid="fig2">D</xref>. On the one hand, these maps provide an intuitive representation of the ML model, in which the red arrows indicate the direction of increasing probability for the target property, forming a “navigation map” for alloy design. Based on the value range associated with the positive class, the compositional design window for ferroelectric perovskites without secondary phases and single solid-solution HEAs can be determined through either forward screening or inverse calculation. On the other hand, underlying patterns in the data can be revealed by analyzing the influence of the constructed features on the target property, particularly the transition boundaries. This approach offers possibilities for extracting physical interpretability and discovering new knowledge.</p>
      </sec>
      <sec id="sec3-2">
        <title>Material visualization regression model</title>
        <p>In regression tasks, the “curse of dimensionality” also poses a significant challenge. Although reducing the dimensionality of input variables can visualize the relationship between inputs and outputs, it is impossible to obtain the relationship between features before and after dimensionality reduction. The proposed 2D-SFG method can not only preserve meaningful information and eliminate redundancies during dimensionality reduction, but also provide explicit mathematical expressions that clarify the connections between the original and transformed features, as well as their influence on material properties. This approach significantly enhances model interpretability and offers valuable support for in-depth investigations into how key features affect performance mechanisms in materials science. To further assess the effectiveness of our approach, we selected studies on ML-assisted alloy design published in high-impact journals, including <italic>Nature Communications</italic> and <italic>Acta Materialia</italic>, for comparative validation.</p>
        <p>Xue <italic>et al.</italic> established a support vector regression prediction model using six input features to design NiTi-based shape memory alloys with low thermal hysteresis, achieving a prediction error of 2.9 K<sup>[<xref ref-type="bibr" rid="B53">53</xref>]</sup>. The authors<sup>[<xref ref-type="bibr" rid="B9">9</xref>]</sup> aimed to optimize both hardness and electrical conductivity in precipitation-strengthened copper alloys. Five key features influencing alloy hardness and six features affecting electrical conductivity were identified through feature selection. By constructing corresponding support vector regression prediction models, prediction errors of 5.9% and 9.7% were achieved, respectively. The material features used in these two regression tasks are summarized in <xref ref-type="table" rid="t3">Table 3</xref>, with additional details provided in the <inline-supplementary-material content-type="local-data" mimetype="application/pdf" xlink:href="jmi6002-SupplementaryMaterials.pdf">Supplementary Materials</inline-supplementary-material>.</p>
        <table-wrap id="t3">
          <label>Table 3</label>
          <caption>
            <p>Features used in regression tasks</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Task</bold>
                </td>
                <td colspan="2" style="border-bottom:1;">
                  <bold>Features</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td rowspan="3">Thermal hysteresis</td>
                <td>
                  <bold>
                    <italic>en</italic>
                  </bold>: Pauling electronegativity</td>
                <td>
                  <bold>
                    <italic>cs</italic>
                  </bold>: Pettifor chemical scale</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>ven</italic>
                  </bold>: Valence electron number</td>
                <td>
                  <bold>
                    <italic>arc</italic>
                  </bold>: Clementi’s atomic radii</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>dor</italic>
                  </bold>: Waber-Cromer pseudopotential radii</td>
                <td>
                  <bold>
                    <italic>mr</italic>
                  </bold>: Metallic radius</td>
              </tr>
              <tr>
                <td rowspan="3">Vickers hardness</td>
                <td>
                  <bold>
                    <italic>M.S3</italic>
                  </bold>: Covalent radii</td>
                <td>
                  <bold>
                    <italic>M.S12</italic>
                  </bold>: Lattice constant <italic>c</italic></td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>V.A8</italic>
                  </bold>: Mass attenuation coefficient variance</td>
                <td>
                  <bold>
                    <italic>V.S7</italic>
                  </bold>: Atom volume variance</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>O12</italic>
                  </bold>: Solubility at room temperature</td>
                <td />
              </tr>
              <tr>
                <td rowspan="3">Electrical conductivity</td>
                <td>
                  <bold>
                    <italic>M.A10</italic>
                  </bold>: Mass attenuation coefficient</td>
                <td>
                  <bold>
                    <italic>M.S6</italic>
                  </bold>: Core electron distance</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>M.E4</italic>
                  </bold>: Absolute electronegativity</td>
                <td>
                  <bold>
                    <italic>V.E6</italic>
                  </bold>: Second ionization energy</td>
              </tr>
              <tr>
                <td>
                  <bold>
                    <italic>M.C4</italic>
                  </bold>: Melting enthalpy</td>
                <td>
                  <bold>
                    <italic>HV</italic>
                  </bold>: Vickers hardness</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>
          <xref ref-type="fig" rid="fig3">Figure 3A</xref>-<xref ref-type="fig" rid="fig3">C</xref> illustrates the iterative feature generation process for the two regression cases. As the number of genetic iterations increases, the 10-fold cross-validation error progressively decreases, indicating that the two constructed features incorporate increasingly meaningful information and thereby contribute to model improvement. Notably, the error for the hardness regression task continued to decrease beyond 100 iterations. However, further increasing generations resulted in overly complex expressions. This finding reflects the need for more sophisticated mathematical representations to accurately model the underlying strengthening mechanisms and integrate the substantial information embedded within the original features. To balance model accuracy and expression complexity, the evolutionary process was terminated after 100 generations. The final mathematical expressions of the evolved features after 100 generations are provided in Equations (5) to (10).</p>
        <fig id="fig3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Application of the 2D-SFG method to regression tasks. (A-C) Iterative feature generation process; the red curve indicates the vibration in optimal performance within the population; (D-F) Contour maps of alloy properties; the red arrows indicate the gradient variation of the target property. 2D-SFG: Two-dimensional symbolic feature generation; RMSE: root mean square error; MAPE: mean absolute percentage error.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6002.fig.3.jpg" />
        </fig>
        <p><bold>ΔT</bold>:</p>
        <p><disp-formula> <label>(5)</label> <tex-math id="E1"> $$  \boldsymbol{X_{R1}=(arc+dor)\times cs-dor-ven} $$ </tex-math></disp-formula></p>
		<p><disp-formula> <label>(6)</label> <tex-math id="E1"> $$  \boldsymbol{X_{R2}=\frac{en}{mr\times (2cs+arc+mr+en+dor)}} $$ </tex-math></disp-formula></p>
      <p><bold>HV:</bold></p>
        <p><disp-formula> <label>(7)</label> <tex-math id="E1"> $$  \boldsymbol{X_{R3}=\frac{M.S3+O12}{V.A8}+V.S7-O12-\frac{V.A8}{M.S12}} $$ </tex-math></disp-formula></p>
		<p><disp-formula> <label>(8)</label> <tex-math id="E1"> $$  \boldsymbol{X_{R4}=M.S3\times V.S7+M.S3-M.S12-\frac{V.S7-1}{V.A8\times O12-M.S3}} $$ </tex-math></disp-formula></p>
      <p><bold>EC:</bold></p>
        <p><disp-formula> <label>(9)</label> <tex-math id="E1"> $$  \boldsymbol{X_{R5}=M.A10\times M.S6-M.A10} $$ </tex-math></disp-formula></p>
		<p><disp-formula> <label>(10)</label> <tex-math id="E1"> $$  \boldsymbol{X_{R6}=\frac{M.A10}{M.S6\times HV}+3\times M.E4} $$ </tex-math></disp-formula></p>
        <p>where <bold><italic>X<sub>R</sub></italic><sub>1</sub></bold>, <bold><italic>X<sub>R</sub></italic><sub>2</sub></bold>, <bold><italic>X<sub>R</sub></italic><sub>3</sub></bold>, <bold><italic>X<sub>R</sub></italic><sub>4</sub></bold>, <bold><italic>X<sub>R</sub></italic><sub>5</sub></bold>, and <bold><italic>X<sub>R</sub></italic><sub>6</sub></bold> denote the constructed symbolic features. Definitions of all other parameters can be found in <xref ref-type="table" rid="t3">Table 3</xref>.</p>
        <p>Support vector regression models were established using the constructed features as input to predict alloy properties across different values, as visualized in <xref ref-type="fig" rid="fig3">Figure 3D</xref>-<xref ref-type="fig" rid="fig3">F</xref>. The red arrows in each contour plot indicate the gradient variation of the target property, serving as guidance for efficiently approaching the desired property objectives. For instance, thermal hysteresis is minimized when features <bold><italic>X<sub>R</sub></italic><sub>1</sub></bold> and <bold><italic>X<sub>R</sub></italic><sub>2</sub></bold> approach around 145 and 4.2 × 10<sup>-5</sup>, respectively. Accordingly, NiTi-based shape memory alloys with low thermal hysteresis can be designed by forward screening or inverse calculation of compositions that satisfy this specific feature range. Similarly, higher alloy hardness is achieved near <bold><italic>X<sub>R</sub></italic><sub>3</sub></bold> ≈ -4 and <bold><italic>X<sub>R</sub></italic><sub>4</sub></bold> ≈ -246, while superior electrical conductivity is attained around <bold><italic>X<sub>R</sub></italic><sub>5</sub></bold> ≈ 12.5 and <bold><italic>X<sub>R</sub></italic><sub>6</sub></bold> ≈ 14.2. These identified value ranges offer practical and interpretable design guidelines for developing copper alloys with an improved balance between hardness and electrical conductivity.</p>
      </sec>
      <sec id="sec3-3">
        <title>Intelligent visualization-driven materials design</title>
        <p>As illustrated in <xref ref-type="fig" rid="fig2">Figures 2</xref> and <xref ref-type="fig" rid="fig3">3</xref>, the 2D-SFG method effectively visualizes phase boundaries and property contours, enabling intuitive identification of target regions and variation trends. A direct correspondence between composition design windows and target properties was established by mapping candidate alloy compositions into 2D symbolic features. In this work, we employed the 2D-SFG method to construct visualization models that can compute symbolic features for unknown alloy compositions. These models were subsequently used to evaluate and predict target properties, successfully screening refractory HEAs with single solid-solution phases, as well as advanced copper alloy compositions with superior performance. In the V-Nb-Ti-W-Zr-Mo-Hf-Ta HEA system, a genetic algorithm was used to define a composition space with 1 at.% increments. The ten-dimensional features listed in <xref ref-type="table" rid="t2">Table 2</xref> were computed for each composition and projected into a 2D visualization space using Equations (3) and (4), thereby identifying candidate compositions with a high probability of forming solid-solution phases, as summarized in <xref ref-type="table" rid="t4">Table 4</xref>.</p>
        <table-wrap id="t4">
          <label>Table 4</label>
          <caption>
            <p>Composition of HEAs</p>
          </caption>
          <table frame="hsides" rules="groups" displaytype="1">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Alloy (at.%)</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>V</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Nb</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Ti</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>W</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Zr</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Mo</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Hf</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Ta</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>HEA-1</td>
                <td>30</td>
                <td>29</td>
                <td>8</td>
                <td>12</td>
                <td>10</td>
                <td>9</td>
                <td>1</td>
                <td>1</td>
              </tr>
              <tr>
                <td>HEA-2</td>
                <td>30</td>
                <td>27</td>
                <td>18</td>
                <td>13</td>
                <td>10</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>HEAs: High-entropy alloys.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>
          <xref ref-type="fig" rid="fig4">Figure 4A</xref> displays the classification probability and evolutionary path of alloys across two generations, showing a clear design pathway toward higher solid-solution probability. The selected alloys were synthesized using vacuum arc melting and characterized by X-ray diffraction (XRD). As shown in <xref ref-type="fig" rid="fig4">Figure 4B</xref>, all as-cast alloys exhibit a single body-centered cubic (BCC) solid-solution phase, consistent with the predictions of the 2D-SFG method. <xref ref-type="fig" rid="fig4">Figure 4C</xref> compares the predictions of different visualization modeling approaches. While most methods struggle to accurately identify the phase structures of alloys with low solid-solution probabilities, as shown in <xref ref-type="fig" rid="fig4">Figure 4A</xref>, only the 2D-SFG method correctly predicts the phase structures of both alloys. These results underscore the strong generalization capability and classification accuracy of the proposed approach for phase identification in HEAs.</p>
        <fig id="fig4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>2D-SFG method for HEA design. (A) Local classification probability map; (B) XRD characterization results; (C) Phase prediction results obtained using different methods. 2D-SFG: Two-dimensional symbolic feature generation; HEA: high-entropy alloy; XRD: X-ray diffraction; BCC: body-centered cubic; PCA: principal component analysis; KPCA: kernel principal component analysis; LLE: locally linear embedding; MDS: multidimensional scaling.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6002.fig.4.jpg" />
        </fig>
        <p>
          <xref ref-type="fig" rid="fig5">Figure 5</xref> illustrates the application of the constructed hardness and conductivity visualization models to the unexplored composition space of the Cu-Ni-Si system. A promising copper alloy composition, Cu-1.87Ni-0.55Si-0.47Co-0.11Mg-0.07Zr-0.21Zn, was identified on the performance Pareto front as exhibiting a favorable combination of high hardness and medium conductivity. The designed alloy was synthesized via vacuum induction melting, achieving a peak hardness of 275 HV and a corresponding electrical conductivity of 47.2 %IACS (International Annealed Copper Standard). As summarized in <xref ref-type="table" rid="t5">Table 5</xref>, the prediction performance of different design methods was compared. The 2D-SFG model demonstrated superior generalization capability, with all errors between experimental measurements and model predictions remaining below 7%, confirming its effectiveness in supporting the rational design of high-performance alloys.</p>
        <fig id="fig5" position="float" width="420">
          <label>Figure 5</label>
          <caption>
            <p>Properties of the designed alloys within the Cu-Ni-Si system. Blue solid dots represent the collected experimental dataset, while white hollow dots represent the explored composition design space. The dashed line indicates the identified Pareto front, and the solid red sphere marks the optimal alloy composition selected through the 2D-SFG-guided design approach. 2D-SFG: Two-dimensional symbolic feature generation; IACS: International Annealed Copper Standard.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6002.fig.5.jpg" />
        </fig>
        <table-wrap id="t5">
          <label>Table 5</label>
          <caption>
            <p>Prediction results of properties obtained using different methods</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Methods</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>2D-SFG</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Direct</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>PCA</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>KPCA</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>LLE</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Isomap</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>MDS</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>HV<sub>pred</sub> (HV)</td>
                <td>273</td>
                <td>268</td>
                <td>209</td>
                <td>233</td>
                <td>213</td>
                <td>215</td>
                <td>216</td>
              </tr>
              <tr>
                <td>Percentage error</td>
                <td>0.7%</td>
                <td>2.5%</td>
                <td>24.1%</td>
                <td>15.3%</td>
                <td>22.5%</td>
                <td>21.8%</td>
                <td>21.5%</td>
              </tr>
              <tr>
                <td>EC<sub>pred</sub> (%IACS)</td>
                <td>50.3</td>
                <td>43.8</td>
                <td>54.2</td>
                <td>46.6</td>
                <td>58.1</td>
                <td>37.6</td>
                <td>43.7</td>
              </tr>
              <tr>
                <td>Percentage error</td>
                <td>6.6%</td>
                <td>7.2%</td>
                <td>14.8%</td>
                <td>1.3%</td>
                <td>23.1%</td>
                <td>20.3%</td>
                <td>7.4%</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>2D-SFG: Two-dimensional symbolic feature generation; PCA: principal component analysis; KPCA: kernel principal component analysis; LLE: locally linear embedding; MDS: multidimensional scaling; IACS: International Annealed Copper Standard.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec id="sec3-4">
        <title>Performance of the intelligent visualization-driven materials design model</title>
        <p>To evaluate the performance of the 2D-SFG method in classification tasks, a comprehensive assessment was conducted using multiple metrics, including accuracy, precision, recall, F1 score, and area under the curve (AUC), as shown in <xref ref-type="fig" rid="fig6">Figure 6A</xref> and <xref ref-type="fig" rid="fig6">B</xref>. The model constructed using 2D-SFG features achieved accuracy and precision rates above 90% on both the training and test sets, with only minor differences between them, indicating no significant overfitting. The F1 score remained consistently above 0.9, reflecting a well-balanced trade-off between precision and recall. Furthermore, the AUC values for both the training and test sets were significantly higher than the 0.9 threshold, demonstrating the model’s strong discriminative ability for classification boundaries and reliability for practical applications.</p>
        <fig id="fig6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Performance of the 2D-SFG method on classification problems. (A and B) Evaluation metrics of the classification models; (C) Comparison of modeling accuracy between direct modeling and symbolic feature generation; (D) Comparison of multiple dimensionality reduction methods with the 2D-SFG method. Error bars indicate the standard deviation obtained from 10-fold cross-validation. 2D-SFG: Two-dimensional symbolic feature generation; AUC: area under the curve; PCA: principal component analysis; KPCA: kernel principal component analysis; LLE: locally linear embedding; MDS: multidimensional scaling.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6002.fig.6.jpg" />
        </fig>
        <p>A comparative analysis was conducted between direct modeling and the 2D-SFG approach, as illustrated in <xref ref-type="fig" rid="fig6">Figure 6C</xref>. The direct modeling method utilized the initial feature set from <xref ref-type="table" rid="t2">Table 2</xref> as input, while the 2D-SFG approach employed the new features defined in Equations (1) to (4). It should be noted that both methods were evaluated using the same training and test datasets and underwent hyperparameter optimization. The 2D-SFG model achieved prediction accuracies of 94.2% for perovskite structure classification and 88.4% for HEA phase classification, outperforming the initial feature-based model, which achieved 85.6% and 84.5%, respectively. These results demonstrate that the 2D-SFG method effectively extracts meaningful information from the original features while reducing interference from redundant or irrelevant data.</p>
        <p>From the perspective of feature reduction, the proposed 2D-SFG method can also be regarded as a dimensionality reduction technique. To evaluate its effectiveness, this work compared it against several common dimensionality reduction methods, including PCA, kernel principal component analysis (KPCA)<sup>[<xref ref-type="bibr" rid="B54">54</xref>]</sup>, locally linear embedding (LLE)<sup>[<xref ref-type="bibr" rid="B55">55</xref>]</sup>, Isomap, and multidimensional scaling (MDS)<sup>[<xref ref-type="bibr" rid="B56">56</xref>]</sup>. All methods were configured to reduce the original features to two dimensions before model construction. As shown in <xref ref-type="fig" rid="fig6">Figure 6D</xref>, models using features from conventional reduction methods exhibited varying degrees of accuracy degradation, indicating the loss of critical information during the reduction process. In contrast, the 2D-SFG approach not only preserved essential information but also enhanced predictive accuracy, demonstrating its superior applicability for classification tasks.</p>
        <p>For the regression tasks, a similar comparative analysis was performed among direct modeling, 2D-SFG modeling, and models built using common dimensionality reduction methods, evaluated through 10-fold cross-validation. The evaluation was based on RMSE and percentage error metrics. As shown in <xref ref-type="fig" rid="fig7">Figure 7</xref>, models using conventional dimensionality reduction methods showed either no significant improvement or a slight increase in error, indicating the substantial limitations of these methods for regression tasks. In contrast, the 2D-SFG approach achieved prediction errors of 1.1 K, 3.7%, and 6.2% for the thermal hysteresis of shape memory alloys, and the hardness and electrical conductivity of copper alloys, respectively. These results are lower than the corresponding errors of 2.9 K, 5.9%, and 9.7% obtained using the original feature set, demonstrating the strong applicability of the 2D-SFG method to regression tasks.</p>
        <fig id="fig7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Comparison between multiple dimensionality reduction methods and the 2D-SFG method. (A) Thermal hysteresis of shape memory alloys; (B) Hardness and electric conductivity of copper alloys. Error bars indicate the standard deviations obtained from 10-fold cross-validation. 2D-SFG: Two-dimensional symbolic feature generation; RMSE: root mean square error; PCA: principal component analysis; KPCA: kernel principal component analysis; LLE: locally linear embedding; MDS: multidimensional scaling; MAPE: mean absolute percentage error.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6002.fig.7.jpg" />
        </fig>
        <p>Although our primary analysis and discussion focused on the support vector machine algorithm due to its robustness in small-sample materials science problems, the core advantage of 2D-SFG, as a feature generation method for physics-informed knowledge discovery, lies in its ability to generate mathematical descriptors that explicitly encode physical mechanisms. This capability alleviates the burden on black-box models to implicitly extract features, thereby enhancing both predictive accuracy and generalization capability. To verify whether these performance gains are algorithm-agnostic, we conducted additional comparative studies using random forest (RF) and gradient boosting (GB) algorithms. The results, presented in <inline-supplementary-material content-type="local-data" mimetype="application/pdf" xlink:href="jmi6002-SupplementaryMaterials.pdf">Supplementary Table 3</inline-supplementary-material>, demonstrate that models trained on symbolic features generated by 2D-SFG consistently outperform those based on original feature inputs across all tested algorithms. These findings indicate that 2D-SFG serves as a versatile and seamlessly compatible module that can be integrated into diverse ML workflows. Extending the 2D-SFG framework to guide more complex architectures, such as Deep Neural Networks, will be a primary focus of our future work.</p>
      </sec>
      <sec id="sec3-5">
        <title>Generated feature importance and interpretability analysis</title>
        <p>The occurrence frequency of each original feature in the explicit expressions generated over 100 iterations was counted to assess feature importance, as illustrated in <xref ref-type="fig" rid="fig8">Figure 8</xref>. A higher frequency indicates greater importance of the corresponding feature. For instance, feature <bold><italic>f</italic><sub>0</sub></bold> does not appear in Equation (2), suggesting that its information is either redundant with that of the other four features or has limited influence on the target property. Consequently, it was discarded in later iterations, resulting in an overall frequency of less than 20. In the case of copper alloy hardness, all features exhibited occurrence frequencies above 100, reflecting their substantial individual importance and joint contribution to the target property. This also explains why the final explicit expression for hardness is mathematically more complex. In contrast, the electrical conductivity of precipitation-strengthened copper alloys is governed by a relatively simpler mechanism compared to hardness. As a result, meaningful information could be extracted from the original features using simpler mathematical operations, leading to a less complex symbolic expression for conductivity.</p>
        <fig id="fig8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Feature importance ranking. (A) Structure classification task for perovskites; (B) Phase classification task for HEAs; (C) Thermal hysteresis regression task for shape memory alloys; (D and E) Comprehensive property regression task for copper alloys; (F) Example of counting rules. HEAs: High-entropy alloys.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6002.fig.8.jpg" />
        </fig>
        <p>This work successfully constructed new features for various material classification and regression problems through the 2D-SFG method. These features not only significantly enhance the predictive performance of ML models but also maintain explicit quantitative relationships with the original features, thereby improving physical interpretability in specific materials research problems. The 2D-SFG method is capable of constructing meaningful nonlinear combinations that capture complex physical interactions. Analysis of the specific mathematical forms of the generated symbolic features, such as products, ratios, and linear corrections, can further elucidate how feature co-occurrence influences target properties.</p>
        <p>In the classification tasks, the new feature <bold><italic>X<sub>C</sub></italic><sub>1</sub></bold> couples the bonding strength driven by electronegativity (<bold><italic>f</italic><sub>2</sub></bold>) with the valence electron number (<bold><italic>f</italic><sub>1</sub></bold>). This formulation reflects the electronic shielding effect, whereby a lower valence electron count amplifies the impact of charge rearrangement induced by electronegativity differences on lattice distortion. The formula demonstrates that perovskite formation requires not only geometric matching but also weighted correction of chemical bond polarity strength by electron concentration<sup>[<xref ref-type="bibr" rid="B57">57</xref>]</sup>. The new feature <bold><italic>X<sub>C</sub></italic><sub>3</sub></bold> employs a multiplicative form to quantify the nonlinear geometric distortion driving force arising from dual deviations in metal radius (<bold><italic>δMR</italic></bold>) and atomic volume (<bold><italic>δAV</italic></bold>). The formation of HEA solid solutions requires not only minimal geometric distortion but also sufficient intrinsic electronic properties and mechanical stiffness to effectively buffer and accommodate inevitable lattice strains<sup>[<xref ref-type="bibr" rid="B58">58</xref>,<xref ref-type="bibr" rid="B59">59</xref>]</sup>.</p>
        <p>In the regression tasks, the original features atomic radius (<bold><italic>arc</italic></bold>) and pseudopotential radius (<bold><italic>dor</italic></bold>), both associated with atomic size mismatch, frequently co-occur. Increases in these values can raise the distortion energy barrier, thereby increasing thermal hysteresis. The new feature <bold><italic>X<sub>R</sub></italic><sub>1</sub></bold> multiplies atomic size-related features by a chemical scaling parameter to capture the synergistic effect between atomic size mismatch and the chemical bonding environment, while subtracting the valence electron number (<bold><italic>ven</italic></bold>) to correct for the shielding effect on lattice distortion in systems with high electron concentrations. This formulation comprehensively reflects their combined influence on thermal hysteresis<sup>[<xref ref-type="bibr" rid="B60">60</xref>]</sup>. Furthermore, the new feature <bold><italic>X<sub>R</sub></italic><sub>2</sub></bold> is expressed as a ratio of electronegativity to multi-scale structural parameters. Physically, a larger denominator indicates stronger lattice distortion and greater resistance to the phase transformation driving force, while a larger numerator reflects more intense electron transfer and a higher phase transformation energy barrier. Consequently, a smaller <bold><italic>X<sub>R</sub></italic><sub>2</sub></bold> value facilitates easier phase transformation and corresponds to lower thermal hysteresis<sup>[<xref ref-type="bibr" rid="B61">61</xref>,<xref ref-type="bibr" rid="B62">62</xref>]</sup>. The new feature <bold><italic>X<sub>R</sub></italic><sub>5</sub></bold> is formulated as the product of the mass attenuation coefficient and the extranuclear electron distance. This construction captures the coupling between electron scattering efficiency and atomic size effects, where the extranuclear electron distance governs electron cloud distribution. Enhanced electron cloud overlap driven by this interaction leads to significantly improved conductivity. Additionally, the new feature <bold><italic>X<sub>R</sub></italic><sub>6</sub></bold> incorporates measured Vickers hardness and absolute electronegativity. This combination accounts for the effects of lattice distortion and dislocation density. The formulation aligns well with the established understanding that electrical conductivity in metallic systems is collectively determined by the interplay among lattice defects, solute atoms, and polarization effects<sup>[<xref ref-type="bibr" rid="B63">63</xref>-<xref ref-type="bibr" rid="B65">65</xref>]</sup>.</p>
        <p>The 2D-SFG method demonstrates a unique capability to automatically discover nonlinear descriptors that are difficult to predefine empirically. Although the resulting feature expressions may appear mathematically complex, each term corresponds to established physical models or empirical relationships in materials science. Furthermore, these explicit mathematical expressions effectively overcome the lack of physical insights inherent in black-box models. However, it is important to acknowledge certain limitations of the generated features: the physical universality of these expressions requires validation across broader material systems, and certain high-order interaction terms might introduce singularities. Future work should focus on enhancing the physical consistency and stability of the feature engineering process.</p>
      </sec>
      <sec id="sec3-6">
        <title>Analysis of the reuse effect of generated features</title>
        <p>To further evaluate whether the symbolic feature generation method successfully integrates and learns universal knowledge, the authors collected a dataset of aluminum alloys subjected to solution and aging treatments. This dataset includes alloy composition, processing parameters, hardness, and electrical conductivity. The initial features listed in <xref ref-type="table" rid="t3">Table 3</xref> were calculated, with the solid solubility of elements in aluminum used as a substitute for their solubility in copper. As shown in <xref ref-type="table" rid="t6">Table 6</xref>, calculating features <bold><italic>X<sub>R</sub></italic><sub>3</sub></bold> to <bold><italic>X<sub>R</sub></italic><sub>6</sub></bold> using the aluminum alloy dataset and retraining the model (Method A) yielded better predictive performance than the model trained with the original aluminum alloy features (Method B). For hardness prediction, Method A achieved cross-validation, training, and test errors of 9.9%, 7.5%, and 8.4%, respectively, representing an average reduction of 2.0% compared to Method B (10.9%, 9.6%, and 11.3%). Similarly, for electrical conductivity prediction, the errors decreased from 3.8%, 3.6%, and 5.3% to 2.9%, 1.1%, and 2.4%, corresponding to an average improvement of 2.1%. When a RF classifier was used instead, the 2D symbolic features still reduced the average hardness prediction error by 1.8% and the conductivity prediction error by 2.2%, confirming that the advantage stems from the features themselves rather than from algorithmic coincidence.</p>
        <table-wrap id="t6">
          <label>Table 6</label>
          <caption>
            <p>Prediction results of models under different methods</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td rowspan="2">
                  <bold>Methods</bold>
                </td>
                <td colspan="3">
                  <bold>Hardness</bold>
                </td>
                <td colspan="3">
                  <bold>Electrical conductivity</bold>
                </td>
              </tr>
              <tr>
                <td style="border-bottom:1;">
                  <bold>CV</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Training</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Testing</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>CV</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Training</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Testing</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>Method A (SVR)</td>
                <td>
                  <bold>9.9%</bold>
                </td>
                <td>
                  <bold>7.5%</bold>
                </td>
                <td>
                  <bold>8.4%</bold>
                </td>
                <td>
                  <bold>2.9%</bold>
                </td>
                <td>
                  <bold>1.1%</bold>
                </td>
                <td>
                  <bold>2.4%</bold>
                </td>
              </tr>
              <tr>
                <td>Method B (SVR)</td>
                <td>10.9%</td>
                <td>9.6%</td>
                <td>11.3%</td>
                <td>3.8%</td>
                <td>3.6%</td>
                <td>5.3%</td>
              </tr>
              <tr>
                <td>Method A (RF)</td>
                <td>12.3%</td>
                <td>10.8%</td>
                <td>13.3%</td>
                <td>3.2%</td>
                <td>3.1%</td>
                <td>7.6%</td>
              </tr>
              <tr>
                <td>Method B (RF)</td>
                <td>14.5%</td>
                <td>11.6%</td>
                <td>15.7%</td>
                <td>4.3%</td>
                <td>5.7%</td>
                <td>10.5%</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Bold values highlight the superior results achieved by the proposed method relative to the benchmark methods. CV: Cross-validation; SVR: support vector regression; RF: random forest.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The distributional differences in feature values between copper and aluminum alloys pose a challenge for out-of-distribution generalization when copper alloy models are directly applied to aluminum alloy data. Although Method B was retrained using aluminum alloy data, the original features may still fail to capture the complex nonlinear relationships governing material properties. In contrast, the symbolically generated features derived from copper alloy data preserve the underlying mappings associated with alloy performance, as evidenced by the superior predictive performance of the aluminum alloy regression model (Method A) built with these features. The strong performance of Method A confirms both the applicability and effectiveness of the symbolically generated features, which not only retain key physical information learned through the 2D-SFG method but also adapt effectively to aluminum alloy data through refitting. The demonstrated predictive capability across both copper and aluminum alloy systems validates the transferability of the 2D-SFG method, offering a novel approach for cross-system materials modeling.</p>
      </sec>
    </sec>
    <sec id="sec4">
      <title>CONCLUSIONS</title>
      <p>This study aimed to overcome the dual challenges of limited model interpretability and the difficulty of extracting reusable design routes in materials informatics by developing a novel 2D-SFG method. Our findings demonstrate that integrating symbolic regression with genetic algorithms not only significantly enhances predictive accuracy across diverse material systems, but also yields compact mathematical formulas that align with classical physical models, thereby ensuring visualization and physically interpretable dimensionality reduction. Furthermore, the generated 2D feature maps provide intuitive visualizations of phase boundaries and property contours, effectively guiding the successful design of high-performance alloys without relying on black-box predictions. This interpretable framework lays the foundation for a fundamental shift in materials design methodology, moving from “black-box” exploration to “white-box” rational design by exploring the relationship between data and fundamental physical mechanisms.</p>
    </sec>
  </body>
  <back>
    <sec>
      <title>DECLARATIONS</title>
      <sec>
        <title>Authors’ contributions</title>
        <p>Carried out the majority of the modeling and experimental work: Yong, W.; Zhang, H.</p>
        <p>Contributed to the discussion and data analysis: Li, Z.; He, J.</p>
        <p>Conducted data collection: Chen, C.; Gao, Y.</p>
        <p>Designed the modeling approaches and supervised the research: Fu, H.; Xie, J.</p>
        <p>All authors interpreted the results and contributed to the writing of the paper.</p>
      </sec>
      <sec>
        <title>Availability of data and materials</title>
        <p>The data that support the findings of this study are available from the corresponding author upon reasonable request.</p>
      </sec>
      <sec>
        <title>AI and AI-assisted tools statement</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Financial support and sponsorship</title>
        <p>This work was supported by the National Major Science and Technology Projects of China (2024ZD0608100), the National Natural Science Foundation for Distinguished Young Scholars of China (No. 52425409), the National Natural Science Foundation of China (Nos. 52404387, 52374379, and U24A2029), the Xiaomi Young Scholars Program, and the Interdisciplinary Research Project for Young Teachers of USTB (Fundamental Research Funds for the Central Universities) (No. FRF-IDRY-23-002). The Article Processing Charge (APC) was fully funded by Shaanxi Sirui Advanced Materials Co., Ltd.</p>
      </sec>
      <sec>
        <title>Conflicts of interest</title>
        <p>Fu, H. is a Guest Editor of the Special Topic “AI-Driven Design and Intelligent Manufacturing of Advanced Copper Alloy” in <italic>Journal of Materials Informatics</italic>. He was not involved in any stage of the editorial process, notably including reviewer selection, manuscript handling, or decision making. The other authors declared that there are no conflicts of interest.</p>
      </sec>
      <sec>
        <title>Ethical approval and consent to participate</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Consent for publication</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Copyright</title>
        <p>© The Author(s) 2026.</p>
      </sec>
	<sec sec-type="supplementary-material">
      <title>Supplementary Materials</title>
          <supplementary-material content-type="local-data">
                <media xlink:href="jmi6002-SupplementaryMaterials.pdf" mimetype="application/pdf">
                        <caption>
                                <p>Supplementary Materials</p>
                        </caption>
                </media>
          </supplementary-material>

          </sec>  
    </sec>
    <ref-list>
      <ref id="B1">
        <label>1</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Rahman</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Hossain</surname>
              <given-names>MS</given-names>
            </name>
            <name>
              <surname>Siddique</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Review: machine learning approaches for diverse alloy systems</article-title>
          <source>J Mater Sci</source>
          <year>2025</year>
          <volume>60</volume>
          <fpage>12189</fpage>
          <lpage>221</lpage>
          <pub-id pub-id-type="doi">10.1007/s10853-025-11154-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B2">
        <label>2</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hu</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Tan</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Knibbe</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Recent applications of machine learning in alloy design: a review</article-title>
          <source>Mater Sci Eng R Rep</source>
          <year>2023</year>
          <volume>155</volume>
          <fpage>100746</fpage>
          <pub-id pub-id-type="doi">10.1016/j.mser.2023.100746</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B3">
        <label>3</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kumar</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Mukhopadhyay</surname>
              <given-names>NK</given-names>
            </name>
            <name>
              <surname>Yadav</surname>
              <given-names>TP</given-names>
            </name>
          </person-group>
          <article-title>Recent progresses on high entropy alloy development using machine learning: a review</article-title>
          <source>Comput Mater Today</source>
          <year>2025</year>
          <volume>8</volume>
          <fpage>100038</fpage>
          <pub-id pub-id-type="doi">10.1016/j.commt.2025.100038</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B4">
        <label>4</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cheng</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Fu</surname>
              <given-names>CL</given-names>
            </name>
            <name>
              <surname>Okabe</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Artificial intelligence-driven approaches for materials design and discovery</article-title>
          <source>Nat Mater</source>
          <year>2026</year>
          <volume>25</volume>
          <fpage>174</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1038/s41563-025-02403-7</pub-id>
          <pub-id pub-id-type="pmid">41482571</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B5">
        <label>5</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hart</surname>
              <given-names>GLW</given-names>
            </name>
            <name>
              <surname>Mueller</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Toher</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Curtarolo</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for alloys</article-title>
          <source>Nat Rev Mater</source>
          <year>2021</year>
          <volume>6</volume>
          <fpage>730</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1038/s41578-021-00340-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B6">
        <label>6</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Merchant</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Batzner</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Schoenholz</surname>
              <given-names>SS</given-names>
            </name>
            <name>
              <surname>Aykol</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Cheon</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Cubuk</surname>
              <given-names>ED</given-names>
            </name>
          </person-group>
          <article-title>Scaling deep learning for materials discovery</article-title>
          <source>Nature</source>
          <year>2023</year>
          <volume>624</volume>
          <fpage>80</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-023-06735-9</pub-id>
          <pub-id pub-id-type="pmid">38030720</pub-id>
          <pub-id pub-id-type="pmcid">PMC10700131</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B7">
        <label>7</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Feng</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>Q</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Accelerated development of high-strength and high-conductivity Cu-Cr-Ti alloys based on data-driven design and experimental validation</article-title>
          <source>Mater Design</source>
          <year>2025</year>
          <volume>253</volume>
          <fpage>113948</fpage>
          <pub-id pub-id-type="doi">10.1016/j.matdes.2025.113948</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B8">
        <label>8</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yin</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Lei</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A novel neural network-based alloy design strategy: gated recurrent unit machine learning modeling integrated with orthogonal experiment design and data augmentation</article-title>
          <source>Acta Mater</source>
          <year>2023</year>
          <volume>243</volume>
          <fpage>118420</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2022.118420</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B9">
        <label>9</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Fu</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Zhu</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Yong</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Xie</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Machine learning assisted composition effective design for precipitation strengthened copper alloys</article-title>
          <source>Acta Mater</source>
          <year>2021</year>
          <volume>215</volume>
          <fpage>117118</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2021.117118</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B10">
        <label>10</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Fu</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Dramatically enhanced combination of ultimate tensile strength and electric conductivity of alloys via machine learning screening</article-title>
          <source>Acta Mater</source>
          <year>2020</year>
          <volume>200</volume>
          <fpage>803</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2020.09.068</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B11">
        <label>11</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A machine learning strategy to achieve strength-conductivity-ductility synergy of high‐performance Cu-Ni-Co-Si alloys via rolling and aging process</article-title>
          <source>J Mater Sci Technol</source>
          <year>2026</year>
          <volume>267</volume>
          <fpage>184</fpage>
          <lpage>97</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jmst.2025.12.040</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B12">
        <label>12</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sohail</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Xue</surname>
              <given-names>D</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Machine-learning design of ductile FeNiCoAlTa alloys with high strength</article-title>
          <source>Nature</source>
          <year>2025</year>
          <volume>643</volume>
          <fpage>119</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-025-09160-2</pub-id>
          <pub-id pub-id-type="pmid">40533553</pub-id>
          <pub-id pub-id-type="pmcid">PMC12221976</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B13">
        <label>13</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Vazquez</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Chakravarty</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Gurrola</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Arróyave</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A deep neural network regressor for phase constitution estimation in the high entropy alloy system Al-Co-Cr-Fe-Mn-Nb-Ni</article-title>
          <source>npj Comput Mater</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>1021</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-023-01021-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B14">
        <label>14</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>Q</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>High-strength medium-entropy alloy designed by precipitation-strengthening mechanism via machine learning</article-title>
          <source>Mater Sci Eng A</source>
          <year>2023</year>
          <volume>882</volume>
          <fpage>145443</fpage>
          <pub-id pub-id-type="doi">10.1016/j.msea.2023.145443</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B15">
        <label>15</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Vela</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Khatamsaz</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Acemi</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Karaman</surname>
              <given-names>I</given-names>
            </name>
            <name>
              <surname>Arróyave</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Data-augmented modeling for yield strength of refractory high entropy alloys: a Bayesian approach</article-title>
          <source>Acta Mater</source>
          <year>2023</year>
          <volume>261</volume>
          <fpage>119351</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2023.119351</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B16">
        <label>16</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Kwon</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>HS</given-names>
            </name>
            <name>
              <surname>Lee</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>A neural network model for high entropy alloy design</article-title>
          <source>npj Comput Mater</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>1010</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-023-01010-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B17">
        <label>17</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yin</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Rao</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>D</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Interpretable predicting creep rupture life of superalloys: enhanced by domain-specific knowledge</article-title>
          <source>Adv Sci</source>
          <year>2024</year>
          <volume>11</volume>
          <fpage>e2307982</fpage>
          <pub-id pub-id-type="doi">10.1002/advs.202307982</pub-id>
          <pub-id pub-id-type="pmid">38168537</pub-id>
          <pub-id pub-id-type="pmcid">PMC10953578</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B18">
        <label>18</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lian</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Bao</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Xiong</surname>
              <given-names>Q</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Intelligent design of crack-resistant nickel-based superalloys for additive manufacturing by machine learning and multilayer filtering strategy</article-title>
          <source>Mater Today Commun</source>
          <year>2025</year>
          <volume>46</volume>
          <fpage>112387</fpage>
          <pub-id pub-id-type="doi">10.1016/j.mtcomm.2025.112387</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B19">
        <label>19</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhuang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Antonov</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Alloying effects and effective alloy design of high-Cr CoNi-based superalloys via a high-throughput experiments and machine learning framework</article-title>
          <source>Acta Mater</source>
          <year>2023</year>
          <volume>243</volume>
          <fpage>118525</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2022.118525</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B20">
        <label>20</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ma</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Xin</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Thermodynamic calculation and machine learning aided composition design of new nickel-based superalloys</article-title>
          <source>J Mater Res Technol</source>
          <year>2023</year>
          <volume>26</volume>
          <fpage>4168</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jmrt.2023.08.139</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B21">
        <label>21</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Ru</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Deep learning accelerates the development of Ni-based single crystal superalloys: a physical-constrained neural network for creep rupture life prediction</article-title>
          <source>Mater Design</source>
          <year>2023</year>
          <volume>232</volume>
          <fpage>112174</fpage>
          <pub-id pub-id-type="doi">10.1016/j.matdes.2023.112174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B22">
        <label>22</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xin</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zhong</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Xie</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Luo</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Qiu</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Building an effective deep learning model for mechanical properties prediction of steel</article-title>
          <source>Mater Lett</source>
          <year>2026</year>
          <volume>402</volume>
          <fpage>139262</fpage>
          <pub-id pub-id-type="doi">10.1016/j.matlet.2025.139262</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B23">
        <label>23</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kannan</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Nandwana</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Accelerated alloy discovery using synthetic data generation and data mining</article-title>
          <source>Scr Mater</source>
          <year>2023</year>
          <volume>228</volume>
          <fpage>115335</fpage>
          <pub-id pub-id-type="doi">10.1016/j.scriptamat.2023.115335</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B24">
        <label>24</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wei</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>van der Zwaag</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Jia</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>On the use of transfer modeling to design new steels with excellent rotating bending fatigue resistance even in the case of very small calibration datasets</article-title>
          <source>Acta Mater</source>
          <year>2022</year>
          <volume>235</volume>
          <fpage>118103</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2022.118103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B25">
        <label>25</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ren</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Wei</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Lai</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Building a quantitative composition-microstructure-property relationship of dual-phase steels via multimodal data mining</article-title>
          <source>Acta Mater</source>
          <year>2023</year>
          <volume>252</volume>
          <fpage>118954</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2023.118954</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B26">
        <label>26</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Torresi</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>M</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Inverse design workflow discovers hole-transport materials tailored for perovskite solar cells</article-title>
          <source>Science</source>
          <year>2024</year>
          <volume>386</volume>
          <fpage>1256</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.1126/science.ads0901</pub-id>
          <pub-id pub-id-type="pmid">39666797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B27">
        <label>27</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xu</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Chang</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Search for ABO<sub>3</sub> type ferroelectric perovskites with targeted multi-properties by machine learning strategies</article-title>
          <source>J Chem Inf Model</source>
          <year>2022</year>
          <volume>62</volume>
          <fpage>5038</fpage>
          <lpage>49</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jcim.1c00566</pub-id>
          <pub-id pub-id-type="pmid">34375112</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B28">
        <label>28</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Machine learning identified materials descriptors for ferroelectricity</article-title>
          <source>Acta Mater</source>
          <year>2021</year>
          <volume>209</volume>
          <fpage>116815</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2021.116815</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B29">
        <label>29</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Min</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Cho</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Accelerated discovery of potential ferroelectric perovskite <italic>via</italic> active learning</article-title>
          <source>J Mater Chem C</source>
          <year>2020</year>
          <volume>8</volume>
          <fpage>7866</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1039/d0tc00985g</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B30">
        <label>30</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Balachandran</surname>
              <given-names>PV</given-names>
            </name>
            <name>
              <surname>Kowalski</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Sehirlioglu</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Lookman</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Experimental search for high-temperature ferroelectric perovskites guided by two-step machine learning</article-title>
          <source>Nat Commun</source>
          <year>2018</year>
          <volume>9</volume>
          <fpage>1668</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-018-03821-9</pub-id>
          <pub-id pub-id-type="pmid">29700297</pub-id>
          <pub-id pub-id-type="pmcid">PMC5920103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B31">
        <label>31</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Polak</surname>
              <given-names>MP</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>SY</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Beyond designer’s knowledge: generating materials design hypotheses via a large language model</article-title>
          <source>Acta Mater</source>
          <year>2025</year>
          <volume>297</volume>
          <fpage>121307</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2025.121307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B32">
        <label>32</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tian</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Steel design based on a large language model</article-title>
          <source>Acta Mater</source>
          <year>2025</year>
          <volume>285</volume>
          <fpage>120663</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2024.120663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B33">
        <label>33</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Liao</surname>
              <given-names>W</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Generalizable descriptors for automatic titanium alloys design by learning from texts via large language model</article-title>
          <source>Acta Mater</source>
          <year>2025</year>
          <volume>296</volume>
          <fpage>121275</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2025.121275</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B34">
        <label>34</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Polak</surname>
              <given-names>MP</given-names>
            </name>
            <name>
              <surname>Morgan</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Extracting accurate materials data from research papers with conversational language models and prompt engineering</article-title>
          <source>Nat Commun</source>
          <year>2024</year>
          <volume>15</volume>
          <fpage>1569</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-024-45914-8</pub-id>
          <pub-id pub-id-type="pmid">38383556</pub-id>
          <pub-id pub-id-type="pmcid">PMC10882009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B35">
        <label>35</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Senior</surname>
              <given-names>AW</given-names>
            </name>
            <name>
              <surname>Evans</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Jumper</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Improved protein structure prediction using potentials from deep learning</article-title>
          <source>Nature</source>
          <year>2020</year>
          <volume>577</volume>
          <fpage>706</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-019-1923-7</pub-id>
          <pub-id pub-id-type="pmid">31942072</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B36">
        <label>36</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tep</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Bernacki</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>High-fidelity grain growth modeling: leveraging deep learning for fast computations</article-title>
          <source>Acta Mater</source>
          <year>2025</year>
          <volume>301</volume>
          <fpage>121486</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2025.121486</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B37">
        <label>37</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Deep learning-based X-ray computed tomography image reconstruction and prediction of compression behavior of 3D printed lattice structures</article-title>
          <source>Addit Manuf</source>
          <year>2022</year>
          <volume>54</volume>
          <fpage>102774</fpage>
          <pub-id pub-id-type="doi">10.1016/j.addma.2022.102774</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B38">
        <label>38</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Lundberg</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Lee</surname>
              <given-names>SI</given-names>
            </name>
          </person-group>
          <comment>A unified approach to interpreting model predictions. <italic>arXiv</italic> <bold>2017</bold>, arXiv:1705.07874. <uri xlink:href="https://doi.org/10.48550/arXiv.1705.07874">https://doi.org/10.48550/arXiv.1705.07874</uri>. (accessed 2026-05-21)</comment>
        </nlm-citation>
      </ref>
      <ref id="B39">
        <label>39</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Ribeiro</surname>
              <given-names>MT</given-names>
            </name>
            <name>
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <comment>“Why should I trust you?”: Explaining the predictions of any classifier. <italic>arXiv</italic> <bold>2016</bold>, arXiv:1602.04938. <uri xlink:href="https://doi.org/10.48550/arXiv.1602.04938">https://doi.org/10.48550/arXiv.1602.04938</uri>. (accessed 2026-05-21)</comment>
        </nlm-citation>
      </ref>
      <ref id="B40">
        <label>40</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Alibagheri</surname>
              <given-names>E</given-names>
            </name>
            <name>
              <surname>Ranjbar</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Khazaei</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Kühne</surname>
              <given-names>TD</given-names>
            </name>
            <name>
              <surname>Vaez Allaei</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Remarkable optoelectronic characteristics of synthesizable square‐octagon haeckelite structures: machine learning materials discovery</article-title>
          <source>Adv Funct Mater</source>
          <year>2024</year>
          <volume>34</volume>
          <fpage>2402390</fpage>
          <pub-id pub-id-type="doi">10.1002/adfm.202402390</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B41">
        <label>41</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Peng</surname>
              <given-names>RL</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Machine learning enabled the prediction of γ′-depleted depth during interdiffusion of bond-coated IN792 superalloy</article-title>
          <source>Surf Coat Technol</source>
          <year>2025</year>
          <volume>513</volume>
          <fpage>132448</fpage>
          <pub-id pub-id-type="doi">10.1016/j.surfcoat.2025.132448</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B42">
        <label>42</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Hilhorst</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Bokas</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Gorsse</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Jacques</surname>
              <given-names>PJ</given-names>
            </name>
            <name>
              <surname>Hautier</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A map of single-phase high-entropy alloys</article-title>
          <source>Nat Commun</source>
          <year>2023</year>
          <volume>14</volume>
          <fpage>2856</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-023-38423-7</pub-id>
          <pub-id pub-id-type="pmid">37208345</pub-id>
          <pub-id pub-id-type="pmcid">PMC10199023</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B43">
        <label>43</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Pearson</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>LIII. On lines and planes of closest fit to systems of points in space</article-title>
          <source>Lond Edinb Dublin Philos Mag J Sci</source>
          <year>1901</year>
          <volume>2</volume>
          <fpage>559</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1080/14786440109462720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B44">
        <label>44</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Srinivasan</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Broderick</surname>
              <given-names>SR</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Mapping chemical selection pathways for designing multicomponent alloys: an informatics framework for materials design</article-title>
          <source>Sci Rep</source>
          <year>2015</year>
          <volume>5</volume>
          <fpage>17960</fpage>
          <pub-id pub-id-type="doi">10.1038/srep17960</pub-id>
          <pub-id pub-id-type="pmid">26681142</pub-id>
          <pub-id pub-id-type="pmcid">PMC4683530</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B45">
        <label>45</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tenenbaum</surname>
              <given-names>JB</given-names>
            </name>
            <name>
              <surname>de Silva</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Langford</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>A global geometric framework for nonlinear dimensionality reduction</article-title>
          <source>Science</source>
          <year>2000</year>
          <volume>290</volume>
          <fpage>2319</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1126/science.290.5500.2319</pub-id>
          <pub-id pub-id-type="pmid">11125149</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B46">
        <label>46</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>McInnes</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Healy</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Melville</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <comment>UMAP: uniform manifold approximation and projection for dimension reduction. <italic>arXiv</italic> <bold>2018</bold>, arXiv:1802.03426. <uri xlink:href="https://doi.org/10.48550/arXiv.1802.03426">https://doi.org/10.48550/arXiv.1802.03426</uri>. (accessed 2026-05-21)</comment>
        </nlm-citation>
      </ref>
      <ref id="B47">
        <label>47</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhao</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Lookman</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Yuan</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Closed-loop inverse design of high entropy alloys using symbolic regression-oriented optimization</article-title>
          <source>Mater Today</source>
          <year>2025</year>
          <volume>88</volume>
          <fpage>263</fpage>
          <lpage>71</lpage>
          <pub-id pub-id-type="doi">10.1016/j.mattod.2025.06.033</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B48">
        <label>48</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xue</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Xue</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Yuan</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>An informatics approach to transformation temperatures of NiTi-based shape memory alloys</article-title>
          <source>Acta Mater</source>
          <year>2017</year>
          <volume>125</volume>
          <fpage>532</fpage>
          <lpage>41</lpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2016.12.009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B49">
        <label>49</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Pokorny</surname>
              <given-names>VJ</given-names>
            </name>
            <name>
              <surname>Sponheim</surname>
              <given-names>SR</given-names>
            </name>
            <name>
              <surname>Rawls</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Impact of reduced-dimensionality independent components analysis on event-related potential measurements</article-title>
          <source>Psychophysiology</source>
          <year>2023</year>
          <volume>60</volume>
          <fpage>e14223</fpage>
          <pub-id pub-id-type="doi">10.1111/psyp.14223</pub-id>
          <pub-id pub-id-type="pmid">36416715</pub-id>
          <pub-id pub-id-type="pmcid">PMC10085851</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B50">
        <label>50</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Miracle</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Senkov</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>A critical review of high entropy alloys and related concepts</article-title>
          <source>Acta Mater</source>
          <year>2017</year>
          <volume>122</volume>
          <fpage>448</fpage>
          <lpage>511</lpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2016.08.081</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B51">
        <label>51</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wen</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Phase prediction in high entropy alloys with a rational selection of materials descriptors and machine learning models</article-title>
          <source>Acta Mater</source>
          <year>2020</year>
          <volume>185</volume>
          <fpage>528</fpage>
          <lpage>39</lpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2019.11.067</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B52">
        <label>52</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Machaka</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Motsi</surname>
              <given-names>GT</given-names>
            </name>
            <name>
              <surname>Raganya</surname>
              <given-names>LM</given-names>
            </name>
            <name>
              <surname>Radingoana</surname>
              <given-names>PM</given-names>
            </name>
            <name>
              <surname>Chikosha</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Machine learning-based prediction of phases in high-entropy alloys: a data article</article-title>
          <source>Data Brief</source>
          <year>2021</year>
          <volume>38</volume>
          <fpage>107346</fpage>
          <pub-id pub-id-type="doi">10.1016/j.dib.2021.107346</pub-id>
          <pub-id pub-id-type="pmid">34611534</pub-id>
          <pub-id pub-id-type="pmcid">PMC8477136</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B53">
        <label>53</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xue</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Balachandran</surname>
              <given-names>PV</given-names>
            </name>
            <name>
              <surname>Hogden</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Theiler</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Xue</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Lookman</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Accelerated search for materials with targeted properties by adaptive design</article-title>
          <source>Nat Commun</source>
          <year>2016</year>
          <volume>7</volume>
          <fpage>11241</fpage>
          <pub-id pub-id-type="doi">10.1038/ncomms11241</pub-id>
          <pub-id pub-id-type="pmid">27079901</pub-id>
          <pub-id pub-id-type="pmcid">PMC4835535</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B54">
        <label>54</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Schölkopf</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Smola</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Müller</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Nonlinear component analysis as a kernel eigenvalue problem</article-title>
          <source>Neural Comput</source>
          <year>1998</year>
          <volume>10</volume>
          <fpage>1299</fpage>
          <lpage>319</lpage>
          <pub-id pub-id-type="doi">10.1162/089976698300017467</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B55">
        <label>55</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Roweis</surname>
              <given-names>ST</given-names>
            </name>
            <name>
              <surname>Saul</surname>
              <given-names>LK</given-names>
            </name>
          </person-group>
          <article-title>Nonlinear dimensionality reduction by locally linear embedding</article-title>
          <source>Science</source>
          <year>2000</year>
          <volume>290</volume>
          <fpage>2323</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1126/science.290.5500.2323</pub-id>
          <pub-id pub-id-type="pmid">11125150</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B56">
        <label>56</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hefner</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Warren S. Torgerson, Theory and methods of scaling. New York: John Wiley and Sons, Inc., 1958. Pp. 460</article-title>
          <source>Syst Res</source>
          <year>1959</year>
          <volume>4</volume>
          <fpage>245</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1002/bs.3830040308</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B57">
        <label>57</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tao</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for perovskite materials design and discovery</article-title>
          <source>npj Comput Mater</source>
          <year>2021</year>
          <volume>7</volume>
          <fpage>495</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-021-00495-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B58">
        <label>58</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Liaw</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Solid‐solution phase formation rules for multi‐component alloys</article-title>
          <source>Adv Eng Mater</source>
          <year>2008</year>
          <volume>10</volume>
          <fpage>534</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1002/adem.200700240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B59">
        <label>59</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zuo</surname>
              <given-names>TT</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>Z</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Microstructures and properties of high-entropy alloys</article-title>
          <source>Prog Mater Sci</source>
          <year>2014</year>
          <volume>61</volume>
          <fpage>1</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pmatsci.2013.10.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B60">
        <label>60</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zarinejad</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Dependence of transformation temperatures of NiTi‐based shape‐memory alloys on the number and concentration of valence electrons</article-title>
          <source>Adv Funct Mater</source>
          <year>2008</year>
          <volume>18</volume>
          <fpage>2789</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.1002/adfm.200701423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B61">
        <label>61</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Fu</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Significant reduction of phase-transition hysteresis for magnetocaloric (La<sub>1-</sub><italic><sub>x</sub></italic>Ce<italic><sub>x</sub></italic>)<sub>2</sub>Fe<sub>11</sub>Si<sub>2</sub>H<italic><sub>y</sub></italic> alloys by microstructural manipulation</article-title>
          <source>Acta Mater</source>
          <year>2021</year>
          <volume>207</volume>
          <fpage>116687</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2021.116687</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B62">
        <label>62</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Cheng</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Hong</surname>
              <given-names>M</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Orchestrating phase transition in GeTe thermoelectrics: an investigation into the role of electronegativity</article-title>
          <source>Nano Energy</source>
          <year>2024</year>
          <volume>127</volume>
          <fpage>109723</fpage>
          <pub-id pub-id-type="doi">10.1016/j.nanoen.2024.109723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B63">
        <label>63</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zurcher</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Muller</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Sachslehner</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Groger</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Zehetbauer</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Dislocation resistivity in Cu: dependence of the deviations from Matthiessen’s rule on temperature, dislocation density and impurity content</article-title>
          <source>J Phys Condens Matter</source>
          <year>1995</year>
          <volume>7</volume>
          <fpage>3515</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1088/0953-8984/7/18/016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B64">
        <label>64</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Žnidarič</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Modified Matthiessen’s rule: more scattering leads to less resistance</article-title>
          <source>Phys Rev B</source>
          <year>2022</year>
          <volume>105</volume>
          <fpage>045140</fpage>
          <pub-id pub-id-type="doi">10.1103/physrevb.105.045140</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B65">
        <label>65</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ho</surname>
              <given-names>CY</given-names>
            </name>
            <name>
              <surname>Ackerman</surname>
              <given-names>MW</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>KY</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Electrical resistivity of ten selected binary alloy systems</article-title>
          <source>J Phys Chem Ref Data</source>
          <year>1983</year>
          <volume>12</volume>
          <fpage>183</fpage>
          <lpage>322</lpage>
          <pub-id pub-id-type="doi">10.1063/1.555684</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>