﻿<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.0 20120330//EN" "http://jats.nlm.nih.gov/publishing/1.0/JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="nlm-ta">J. Mater. Inf.</journal-id>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-title-group>
        <journal-title>Journal of Materials Informatics</journal-title>
      </journal-title-group>
      <issn pub-type="epub">2770-372X</issn>
      <publisher>
        <publisher-name>OAE Publishing Inc.</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.20517/jmi.2026.07</article-id>
      <article-categories>
        <subj-group>
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A survey of agentic materials science and engineering: where are we and where are we going?</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <name>
            <surname>Zhu</surname>
            <given-names>Jiayi</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="aff" rid="I#">
            <sup>#</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Zhang</surname>
            <given-names>Longhan</given-names>
          </name>
          <xref ref-type="aff" rid="I2">
            <sup>2</sup>
          </xref>
          <xref ref-type="aff" rid="I#">
            <sup>#</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Zhu</surname>
            <given-names>Yizhang</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Lin</surname>
            <given-names>Xiaotian</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Wu</surname>
            <given-names>Yifan</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Di</surname>
            <given-names>Shimin</given-names>
          </name>
          <xref ref-type="aff" rid="I3">
            <sup>3</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Liu</surname>
            <given-names>Bang</given-names>
          </name>
          <xref ref-type="aff" rid="I4">
            <sup>4</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <name>
            <surname>Luo</surname>
            <given-names>Yuyu</given-names>
          </name>
          <xref ref-type="aff" rid="I1">
            <sup>1</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1">
            <sup>*</sup>
          </xref>
          <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-9530-3327</contrib-id>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <name>
            <surname>Zhang</surname>
            <given-names>Tongyi</given-names>
          </name>
          <xref ref-type="aff" rid="I2">
            <sup>2</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1">
            <sup>*</sup>
          </xref>
          <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-9646-9668</contrib-id>
        </contrib>
      </contrib-group>
      <aff id="I1">
        <sup>1</sup>Data Science and Analytics Thrust, The Hong Kong University of Science and Technology (Guangzhou), Guangzhou 511453, Guangdong, China.</aff>
      <aff id="I2">
        <sup>2</sup>Advanced Materials Thrust, The Hong Kong University of Science and Technology (Guangzhou), Guangzhou 511453, Guangdong, China.</aff>
      <aff id="I3">
        <sup>3</sup>School of Computer Science and Engineering, Southeast University, Nanjing 211189, Jiangsu, China.</aff>
      <aff id="I4">
        <sup>4</sup>Department of Computer Science and Operations Research, University of Montreal, Montreal H3C 3J7, Canada.</aff>
      <aff id="I#">
        <sup>#</sup>Authors contributed equally.</aff>
      <author-notes>
        <corresp id="cor1"><sup>*</sup>Correspondence to: Prof. Tongyi Zhang, Advanced Materials Thrust, The Hong Kong University of Science and Technology (Guangzhou), Guangzhou 511453, Guangdong, China. E-mail: <email>mezhangt@hkust-gz.edu.cn</email>; Prof. Yuyu Luo, Data Science and Analytics Thrust, The Hong Kong University of Science and Technology (Guangzhou), Guangzhou 511453, Guangdong, China. E-mail: <email>yuyuluo@hkust-gz.edu.cn</email></corresp>
        <fn fn-type="other">
          <p>
            <bold>Received:</bold> 2 Mar 2026 | <bold>First Decision:</bold> 24 Mar 2026 | <bold>Revised:</bold> 7 Apr 2026 | <bold>Accepted:</bold> 30 Apr 2026 | <bold>Published:</bold> 26 May 2026</p>
        </fn>
        <fn fn-type="other">
          <p>
            <bold>Academic Editor:</bold> Xingjun Liu | <bold>Copy Editor:</bold> Pei-Yun Wang | <bold>Production Editor:</bold> Pei-Yun Wang</p>
        </fn>
      </author-notes>
      <pub-date pub-type="ppub">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>26</day>
        <month>5</month>
        <year>2026</year>
      </pub-date>
      <volume>6</volume>
      <issue>2</issue>
      <elocation-id>32</elocation-id>
      <permissions>
        <copyright-statement>© The Author(s) 2026.</copyright-statement>
        <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>© The Author(s) 2026. <bold>Open Access</bold> This article is licensed under a Creative Commons Attribution 4.0 International License (<uri xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</uri>), which permits unrestricted use, sharing, adaptation, distribution and reproduction in any medium or format, for any purpose, even commercially, as long as you give appropriate credit to the original author(s) and the source, provide a link to the Creative Commons license, and indicate if changes were made.</license-p>
        </license>
      </permissions>
      <abstract>
        <p>Agents, primarily built upon large language models (LLMs) and equipped with planning, tool use, memory, and self-reflection capabilities, are revolutionizing all aspects of materials science and engineering (MSE), from materials design and experimental execution to industrial manufacturing and deployment, thereby opening the age of agentic MSE. Rather than functioning as isolated artificial intelligence (AI) predictive models, these agents coordinate multi-step scientific workflows by retrieving and structuring knowledge, proposing and refining hypotheses, planning experiments, combining multimodal simulations and characterizations, and, when integrated with AI materials laboratories, closing the loop toward autonomous materials discovery. However, agentic systems exhibit varying degrees of autonomy, and their roles in materials research and development differ accordingly. To systematically examine the landscape of agentic MSE, this survey proposes a six-level autonomy framework (Levels 0-5) that characterizes the progression from human-only workflows to fully autonomous scientific agents. The framework aligns with key task families across the entire MSE pipeline, including information retrieval, property prediction, simulation, synthesis, and characterization. By reviewing recent advances in agentic MSE, we reveal uneven progress across these domains. Knowledge-centric capabilities often remain at an early stage, while experimental orchestration and characterization are starting to explore higher-level agent behaviors. Importantly, achieving mature autonomy requires coordinating multiple tasks rather than optimizing any single task in isolation. Collectively, these insights provide a structured roadmap for advancing agentic MSE toward higher levels of autonomy.</p>
      </abstract>
      <kwd-group>
        <kwd>Materials science and engineering</kwd>
        <kwd>large language models</kwd>
        <kwd>LLM-based agents</kwd>
        <kwd>agentic materials science and engineering</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec id="sec1">
      <title>INTRODUCTION</title>
      <p>Materials science and engineering (MSE) is an important discipline at the intersection of physics, chemistry, and engineering, aiming to understand the complex relationships among a material’s composition, structure, processing conditions, and resulting functional properties. In recent years, a wide range of data-driven and deep learning techniques have been explored across diverse materials contexts, focusing on specific research tasks that span the entire discovery pipeline. These efforts include natural language processing (NLP) for literature-based knowledge extraction, graph neural networks (GNNs)<sup>[<xref ref-type="bibr" rid="B1">1</xref>-<xref ref-type="bibr" rid="B6">6</xref>]</sup> for material representation learning and property prediction, generative models for inverse materials design<sup>[<xref ref-type="bibr" rid="B7">7</xref>,<xref ref-type="bibr" rid="B8">8</xref>]</sup>, and optimization algorithms for process path optimization. Meanwhile, key research tools in MSE are undergoing an AI-driven paradigm shift toward higher-throughput data generation, encompassing atomic- and molecular-level computations<sup>[<xref ref-type="bibr" rid="B9">9</xref>-<xref ref-type="bibr" rid="B11">11</xref>]</sup>, meso- and macro-scale simulations, autonomous characterization analysis, and autonomous high-throughput experimental platforms. Due to the diversity of material classes, such as metals, ceramics, polymers, semiconductors, and composites, as well as the inherently multimodal and multiscale nature of materials data, artificial intelligence (AI) for Materials Science and Engineering (AI4Mat) has emerged in a wide range of forms. Collectively, these developments converge toward a unified vision: the realization of an autonomous AI scientist deeply integrated into every stage of the materials research pipeline, enabling more efficient, accurate, and intelligent scientific discovery and materials innovation.</p>
      <sec id="sec1-1">
        <title>Agentic MSE</title>
        <p>The advent of large language models (LLMs) and LLM-based agents is the catalyst accelerating this vision. Unlike static predictive models, these agents are endowed with capabilities such as planning, memory, tool use, and self-reflection<sup>[<xref ref-type="bibr" rid="B12">12</xref>-<xref ref-type="bibr" rid="B14">14</xref>]</sup>. They can coordinate multi-step scientific workflows, including retrieving and structuring domain knowledge from literature, proposing and refining hypotheses, planning and parameterizing experiments, and invoking simulation or cheminformatics tools. When integrated with robotic platforms, agents can form a closed loop in materials research by executing experiments in the physical world<sup>[<xref ref-type="bibr" rid="B15">15</xref>,<xref ref-type="bibr" rid="B16">16</xref>]</sup>. Early initiatives such as Coscientist<sup>[<xref ref-type="bibr" rid="B17">17</xref>]</sup> have demonstrated the autonomous design and execution of complex chemical tasks in both cloud-based and physical laboratory environments. Self-driving laboratories (SDLs), exemplified by A-Lab<sup>[<xref ref-type="bibr" rid="B18">18</xref>]</sup>, are advancing toward higher levels of autonomy by employing active learning approaches to sustain long-term automated synthesis and discovery cycles. Collectively, these innovations signal a paradigm shift from traditional model-centric methodologies to comprehensive agentic systems that integrate data resources, computational tools, and experimental hardware within a cohesive framework for autonomous materials research<sup>[<xref ref-type="bibr" rid="B19">19</xref>]</sup>.</p>
        <p>We refer to agentic MSE as an emerging research paradigm in which LLM-based agents actively participate in the materials research and development cycle. In this paradigm, agents do not merely predict properties or extract information; instead, they exhibit the ability to perceive the environment, plan multi-step actions, invoke external computational or experimental tools, remember and refine prior outcomes, and autonomously pursue scientific objectives under human oversight. This agentic perspective transforms materials informatics from a data-analysis discipline into an integrated system of reasoning, experimentation, and self-improvement. Consequently, agentic MSE, encompassing the design, evaluation, and governance of autonomous or semi-autonomous agents, presents considerable potential to accelerate discovery, ensure reproducibility, and facilitate collaboration with human scientists across all stages of materials research.</p>
        <p>These trends motivate a fundamental shift from isolated, task-specific modeling to a workflow-oriented systems perspective for materials discovery and development. In this emerging paradigm, data resources, computational tools, experimental platforms, and control policies are no longer disparate elements but components integrated through unified agentic orchestration.</p>
      </sec>
      <sec id="sec1-2">
        <title>A hierarchical framework for agentic MSE</title>
        <p>However, transitioning to such integrated systems reveals a significant challenge, as the progression toward autonomy is highly uneven across the diverse landscape of MSE. This domain comprises distinct task families, ranging from purely informational tasks such as literature retrieval to physically demanding tasks including experimental synthesis. Each family presents unique barriers related to reasoning complexity, tool integration, and safety constraints. This leads to a landscape where AI capabilities vary drastically, extending from simple assistance in one domain to fully autonomous control in another.</p>
        <p>To rigorously evaluate this heterogeneous progress, a simple catalog of individual models or a binary classification of automated <italic>vs.</italic> manual is insufficient. Such approaches fail to capture the nuance between a passive predictive model and an active reasoning agent. Therefore, we advocate examining the field through a hierarchical taxonomy that maps varying degrees of agent autonomy onto specific materials science tasks. Such a framework can provide a standardized metric for benchmarking progress. This methodology identifies not only where high autonomy has been achieved but also where critical gaps in reasoning and integration remain.</p>
        <p>Therefore, to capture the progressive evolution of agentic MSE, we adopt the six-level hierarchy shown in <xref ref-type="fig" rid="fig1">Figure 1</xref>. Similar to the Society of Automotive Engineers (SAE) levels<sup>[<xref ref-type="bibr" rid="B20">20</xref>]</sup> of driving automation, this framework describes a progression from full human control to increasingly autonomous system behavior. Each level specifies a characteristic combination of agent capabilities, human roles, and agent responsibilities, together tracing the transition from human-only execution to fully autonomous scientific discovery.</p>
        <fig id="fig1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of the six-level hierarchy for agentic MSE and its task mapping. (A) Progression from human-only workflows (Level 0) to fully autonomous AI materials scientists (Level 5); (B) Achieved autonomy levels across five core materials science tasks. Established: multiple independently published systems have demonstrated the capability with reproducible methods; Prototype: at least one published system has demonstrated the capability, but replication and generalization remain limited; Exploratory: the capability has been partially demonstrated in isolated or constrained settings, without full end-to-end validation; Visionary: no existing system has yet demonstrated the capability, representing a long-term research objective. MSE: Materials science and engineering; AI: artificial intelligence; LLM: large language model.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6007.fig.1.jpg" />
        </fig>
        <p>• Level 0 - Human-Only. This is the baseline stage of traditional research, in which humans act as the sole executors, manually performing literature reviews, hypothesis formation, and experimentation. At this stage, agents are not yet involved.</p>
        <p>• Level 1 - LLM-Assisted Analysis. Agents begin to play a purely supportive role in scientific workflows, essentially acting as intelligent research assistants or “copilots” for human scientists. At this stage, agents help retrieve information, summarize literature, and make simple predictions, but they do not take initiative or autonomously execute complex tasks. These systems excel at parsing scientific text and extracting structured knowledge<sup>[<xref ref-type="bibr" rid="B21">21</xref>]</sup>. However, their contributions remain advisory: they cannot yet plan multi-step experiments or make independent decisions, and any insights they provide still require human verification<sup>[<xref ref-type="bibr" rid="B22">22</xref>]</sup>.</p>
        <p>• Level 2 - Tool-Augmented Agent. Agents move beyond passive assistance and begin interacting with external tools to accomplish scientific tasks. At this stage, human researchers still define the overall goals, but agents can independently execute subtasks, such as retrieving data, running simulations, or invoking domain-specific libraries, without requiring step-by-step instructions. This tool-augmented paradigm enables agents to ground their reasoning in trusted computational resources, improving both reliability and scope. While humans remain responsible for high-level validation, agents can propose plausible synthesis routes and predict material properties by drawing on databases and simulators.</p>
        <p>• Level 3 - Collaborative Planner. Agents act as “conditionally automated” scientific assistants capable of autonomously planning multi-step tasks, although they still require human oversight at key decision points. Researchers provide high-level goals, and the agents use chain-of-thought reasoning<sup>[<xref ref-type="bibr" rid="B23">23</xref>]</sup>, long-term memory<sup>[<xref ref-type="bibr" rid="B24">24</xref>]</sup>, and tool invocation to autonomously decompose tasks and execute a series of actions.</p>
        <p>• Level 4 - Autonomous Laboratory Agent. Agents at this level are not only capable of autonomous planning but can also operate for extended periods while interacting with real experimental environments. With minimal human intervention, they can complete the closed loop from experimental design to execution and data collection. The agents can continuously maintain working memory, adjust experimental plans based on intermediate results, and directly control laboratory instruments or invoke remote experimental platforms (e.g., A-Lab<sup>[<xref ref-type="bibr" rid="B18">18</xref>]</sup>; lab orchestration software such as ChemOS 2.0<sup>[<xref ref-type="bibr" rid="B25">25</xref>]</sup>). Humans primarily act as high-level supervisors, intervening only at milestone checkpoints or when anomalies occur.</p>
        <p>• Level 5 - AI Materials Scientist. This stage represents the ultimate vision of a “fully autonomous” AI materials scientist. The agent can independently complete the entire scientific research cycle with virtually no human involvement, from formulating original hypotheses to planning research pathways, conducting physical experiments, and summarizing discoveries. Human input is limited to broad thematic directions, and research topics may even arise from the agent’s intrinsic “curiosity”.</p>
        <p>Progress from Level 1 to Level 5 can be characterized by transformative transitions that mark distinct expansions in capability and responsibility:</p>
        <p>• Level 1 → Level 2: Tool-Augmented Grounding. Agents advance from text-only analysis to grounded tool use, anchoring reasoning in materials databases, calculators, and simulators.</p>
        <p>• Level 2 → Level 3: Multi-Step Planning with Memory. Agents adopt persistent contextual memory and decompose complex goals into executable plans to advance from Level 2 to Level 3 autonomy, often through multi-agent planner-executor or generator-critic structures.</p>
        <p>• Level 3 → Level 4: Multi-Task Coordination and Physical Closed-Loop Control. Integration with robotics and instrumentation enables continuous operation across synthesis and characterization, pushing agents to Level 4 autonomy in materials research.</p>
        <p>• Level 4 → Level 5: Self-Reflection and Hypothesis-Driven Science. The envisioned Level 5 “AI materials scientist” autonomously formulates testable hypotheses and produces verifiable reasoning chains under audit and governance<sup>[<xref ref-type="bibr" rid="B26">26</xref>-<xref ref-type="bibr" rid="B28">28</xref>]</sup>.</p>
        <p>As summarized in <xref ref-type="fig" rid="fig1">Figure 1B</xref>, development is uneven across tasks: all five tasks have reached Level 3 autonomy. Synthesis and characterization have reached the Level 4 prototype stage, as pioneering systems such as Coscientist<sup>[<xref ref-type="bibr" rid="B17">17</xref>]</sup> and AdaptiveXRD<sup>[<xref ref-type="bibr" rid="B29">29</xref>]</sup> have demonstrated closed-loop operation with real physical instrumentation and robotic hardware. In contrast, the knowledge-centric tasks (information retrieval and property prediction), addressed by systems such as AccelMat<sup>[<xref ref-type="bibr" rid="B30">30</xref>]</sup> and MARS<sup>[<xref ref-type="bibr" rid="B31">31</xref>]</sup>, as well as simulation, remain exploratory at Level 4, as current systems operate exclusively in the digital domain without verified physical execution. <xref ref-type="fig" rid="fig1">Figure 1</xref> also serves as the organizational backbone of this survey: Section “THE HIERARCHY OF AUTONOMY IN MATERIALS SCIENCE AGENTS” follows this two-dimensional (2D) task–level matrix and discusses each task family vertically across autonomy levels.</p>
        <p>Prior surveys emphasize chemistry-centric model catalogs and case studies of LLMs and agents<sup>[<xref ref-type="bibr" rid="B22">22</xref>,<xref ref-type="bibr" rid="B32">32</xref>-<xref ref-type="bibr" rid="B34">34</xref>]</sup>. Recent surveys provide complementary but different perspectives. The AI4MS survey<sup>[<xref ref-type="bibr" rid="B35">35</xref>]</sup> mainly offers an inventory-style overview of foundation models for materials science, featuring a task-driven taxonomy across six application areas and a broad summary of unimodal models, multimodal models, LLM agents, datasets, and tools. In parallel, Li <italic>et al.</italic> review the rise of AI agents in materials research, highlighting advances in knowledge processing, structure design, and property calculation, and discussing how tool use and experimental automation may support SDLs and, eventually, end-to-end autonomous materials creation<sup>[<xref ref-type="bibr" rid="B36">36</xref>]</sup>. In contrast, our survey focuses on operationalizing autonomy<sup>[<xref ref-type="bibr" rid="B20">20</xref>]</sup> in a materials-grounded way: we introduce a six-level autonomy framework and a 2D task–level map spanning the materials research workflow. We further specify per-level capability requirements and toolchains, which serve as practical design targets for building materials agents toward higher autonomy, with Level 5 as the long-term objective.</p>
        <p>
          <bold>Our Contributions.</bold> We make the following contributions:</p>
        <p>• A materials-science-grounded six-level autonomy framework that characterizes the progression from human-only workflows to highly autonomous scientific agents. By defining explicit capability criteria, the framework clarifies the evolving division of labor between human scientists and AI, laying the foundation for a future research paradigm defined by seamless human-agent collaboration.</p>
        <p>• A structured background that establishes the research foundation for agentic materials science, comprising three components: a comparative analysis of traditional human-centered workflows and emerging agentic paradigms across the five core task families; a review of domain-specific foundation models and their development paradigms; and a synthesis of open-source agentic infrastructure. Together, these components define the current boundaries of what can be agentized in materials research.</p>
        <p>• A task–level matrix aligning autonomy levels with core materials tasks, revealing uneven development across literature understanding, prediction and design, simulation, synthesis, and characterization, and identifying research directions.</p>
        <p>• An analysis of key open challenges in agentic materials science, distinguishing cognition-centric limitations in digital reasoning tasks from execution-centric limitations in physical experimental workflows. Based on this analysis, we propose targeted research directions, including physically grounded reasoning, active perception for closed-loop experimentation, dynamic benchmarking, and safety and governance frameworks, providing a practical roadmap toward higher levels of autonomy.</p>
        <p>
          <bold>Paper Organization.</bold> The remainder of this survey is organized as follows. Section “BACKGROUND: TASK OVERVIEW AND RESEARCH FOUNDATIONS” lays the research foundation for agentic MSE from three angles: a comparison between traditional human-centered and emerging agentic workflows across the five core task families; a review of domain-specific foundation models and their development paradigms; and a synthesis of the open-source agentic infrastructure that collectively defines the current boundaries of what can be agentized. Section “THE HIERARCHY OF AUTONOMY IN MATERIALS SCIENCE AGENTS” constitutes the analytical core of the survey. Guided by the six-level autonomy framework, it examines each of the five task families vertically across autonomy levels, revealing both the maturity and the remaining gaps in each domain. Cross-task agents that integrate multiple task families are discussed at the end of this section. Section “FUTURE WORK” identifies current challenges and proposes targeted research directions.</p>
      </sec>
    </sec>
    <sec id="sec2">
      <title>BACKGROUND: TASK OVERVIEW AND RESEARCH FOUNDATIONS</title>
      <sec id="sec2-1">
        <title>Key task families across MSE research</title>
        <p>Before examining agentic systems at specific autonomy levels, we first establish the research foundations upon which they are built. This section introduces the five core task families that define the scope of MSE research, traces the workflow transformation from human-centered to agentic paradigms, and reviews the domain-specific foundation models and open-source infrastructure that collectively enable agentic behavior.</p>
        <p>To establish consistent terminology for the subsequent analysis, we formalize five fundamental tasks that collectively represent the core of materials research. Each task occupies a distinct position in the data–model–experiment cycle and serves as a target for progressive agentic autonomy.</p>
        <p>
          <bold>• Information Extraction (IE) and Hypothesis Generation</bold> focuses on extracting and structuring scientific knowledge from literature, patents, and databases. It converts unstructured textual, tabular, and graphical content into structured representations such as entities, relations, and process–property mappings. Based on the organized knowledge, agents generate scientifically grounded and testable hypotheses that guide downstream modeling and experimentation.</p>
        <p>
          <bold>• Property Prediction and Design</bold> focuses on learning predictive relationships among composition, structure, processing conditions, and resulting material properties. It includes forward modeling for property estimation from known descriptors and inverse design for discovering new materials that meet specified performance objectives while ensuring thermodynamic stability and synthetic feasibility.</p>
        <p>
          <bold>• Simulation and Multiscale Modeling</bold> integrates computational methods that operate across quantum, atomic, mesoscopic, and continuum scales. Its goal is to reproduce the physical, chemical, and mechanical behaviors of materials, connect phenomena across scales, and provide theoretical insights that complement and validate experimental results.</p>
        <p>
          <bold>• Automated Experimental Synthesis</bold> addresses the autonomous planning, execution, and optimization of synthesis workflows using robotic, microfluidic, or high-throughput experimental systems. Agents select synthesis routes, control equipment, monitor reactions in real time<sup>[<xref ref-type="bibr" rid="B17">17</xref>]</sup>, and adaptively adjust parameters through feedback from analytical measurements to achieve desired material outcomes with reproducibility and safety.</p>
        <p>
          <bold>• Characterization and Data Analysis</bold> involves the acquisition, preprocessing, and interpretation of experimental data obtained from characterization instruments such as X-ray diffraction (XRD), X-ray photoelectron spectroscopy (XPS), scanning electron microscopy/transmission electron microscopy (SEM/TEM), and spectroscopy. It includes automated noise removal, feature extraction, and quantitative identification of structural, compositional, and electronic characteristics. Advanced systems further employ active learning to optimize measurement strategies for maximal information gain.</p>
      </sec>
      <sec id="sec2-2">
        <title>From human-centered materials research to agentic workflows</title>
        <p>Building upon the definitions above and the proposed autonomy framework, <xref ref-type="fig" rid="fig2">Figure 2</xref> illustrates a fundamental transformation in MSE workflows. This schematic contrasts the traditional human-centric approach [all subfigures (a) of <xref ref-type="fig" rid="fig2">Figure 2</xref>], characteristic of Level 0 and Level 1 autonomy, with the emerging agentic MSE research paradigm [all subfigures (b) of <xref ref-type="fig" rid="fig2">Figure 2</xref>].</p>
        <fig id="fig2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Comparative overview of materials research workflows: traditional methods <italic>vs.</italic> agentic approaches across five representative tasks: (1) IE and hypothesis generation, (2) property prediction and design, (3) simulation and multiscale modeling, (4) automated experimental synthesis, and (5) characterization and data analysis. In each panel, the left side shows a conventional human-driven workflow, while the right side illustrates an agentic alternative in which AI agents coordinate planning, knowledge integration, tool invocation, and iterative analysis. IE: Information extraction; AI: artificial intelligence; NLP: natural language processing; KG: knowledge graph; DFT: density functional theory; FEM: finite element method; HPC: high performance computing; APIs: application programming interfaces.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jmi6007.fig.2.jpg" />
        </fig>
        <p>In prior MSE workflows, research tasks are mostly linear and handled separately. As illustrated in the left panel [all Subfigures (a) of <xref ref-type="fig" rid="fig2">Figure 2</xref>], the human scientist serves as the sole central processor who manually defines objectives, designs experiments, executes protocols, and interprets data. Feedback loops, such as redesigning synthesis routes or refining hypotheses, rely entirely on human intuition and manual intervention<sup>[<xref ref-type="bibr" rid="B37">37</xref>,<xref ref-type="bibr" rid="B38">38</xref>]</sup>. This bottleneck restricts discovery throughput and often disconnects high-level reasoning from low-level execution. Similarly, in computational domains such as simulation and characterization, data processing software operates as a passive utility that requires continuous manual calibration and file manipulation.</p>
        <p>Central to the agentic paradigm is the shift from fragmented manual steps to integrated reasoning and planning. In this framework, AI agents serve as orchestration hubs that actively perceive contextual information and formulate multi-stage strategies. As demonstrated in all subfigures (b) of <xref ref-type="fig" rid="fig2">Figure 2</xref>, the agent acts as a dynamic hub that seamlessly integrates external resources, ranging from internet application programming interfaces (APIs) and computational simulators to physical laboratory instruments<sup>[<xref ref-type="bibr" rid="B17">17</xref>,<xref ref-type="bibr" rid="B39">39</xref>]</sup>. This integration transforms previously independent software tools and hardware systems into active modules under agentic control. Most importantly, this architecture establishes autonomous feedback loops. Whether performing inverse design for property prediction or optimizing synthesis parameters in real time, the system iteratively refines its actions. By analyzing output data to automatically trigger redesigns or next-step suggestions, the agentic workflow closes the loop between decision making and execution, significantly reducing the need for continuous human oversight.</p>
      </sec>
      <sec id="sec2-3">
        <title>Foundation models for MSE agents</title>
        <p>While autonomous agents coordinate workflows, make decisions, and interact with tools, these actions ultimately depend on the expressive power and inductive biases of underlying models. These models encode scientific knowledge, structure–property relationships, and implicit physical constraints that shape how an agent interprets information and takes actions. Before discussing agentic works within specific materials science tasks, we therefore review the foundation models upon which agentic systems are built. We first outline the distinct philosophies guiding the development of domain-specific LLMs for MSE, and then summarize representative models across key materials sub-domains.</p>
        <sec id="sec2-3-1">
          <title>Development paradigms of domain-specific LLMs</title>
          <p>Efforts to adapt LLMs to MSE can be grouped into several methodological families. Each family corresponds to a different view on how domain specialization should be integrated into general language models, and each involves different trade-offs in model capability, generalization, and computational cost.</p>
          <p>Continued pretraining<break/>Current LLMs are pretrained on extensive and diverse text corpora. To further develop generalized scientific priors in a specific domain of interest, continued pretraining (CPT) is a key strategy. In this approach, established LLMs are further exposed to vast corpora of scientific texts, databases, and structured materials knowledge before being adapted to downstream tasks. Models such as MatSciBERT<sup>[<xref ref-type="bibr" rid="B40">40</xref>]</sup> and MatBERT<sup>[<xref ref-type="bibr" rid="B41">41</xref>]</sup> follow this path. Specifically, MatSciBERT is a materials-aware BERT model initialized from SciBERT and further pretrained on a large curated corpus (around 285M words) of MSE literature. Using RoBERTa-style<sup>[<xref ref-type="bibr" rid="B42">42</xref>]</sup> pretraining and domain-adaptive continuation, it achieves lower validation perplexity and state-of-the-art performance across three downstream tasks. Compared to general-purpose pretrained LLMs, these studies<sup>[<xref ref-type="bibr" rid="B40">40</xref>,<xref ref-type="bibr" rid="B41">41</xref>]</sup> focus on scientific domains, particularly MSE. They typically require millions of domain-specific documents for models to learn statistical structures in materials knowledge, including composition-structure-property relationships, synthesis terminology, and common experimental or theoretical narratives. The learned prior knowledge is beneficial not only for NLP tasks but also for intelligent agent applications, where pretrained models serve as the core of decision making and are integrated into simulation or experimental workflows.</p>
          <p>Supervised fine-tuning<break/>Since CPT requires large-scale domain data, which may be unavailable in niche areas, supervised fine-tuning (SFT) provides an alternative strategy for domain adaptation. In this approach, curated labeled datasets targeting specific downstream tasks are constructed, such as property prediction<sup>[<xref ref-type="bibr" rid="B43">43</xref>]</sup>, materials entity extraction<sup>[<xref ref-type="bibr" rid="B40">40</xref>]</sup>, and reaction prediction<sup>[<xref ref-type="bibr" rid="B44">44</xref>]</sup>. These datasets are then used to fine-tune pretrained LLMs in a supervised manner. In the field of MSE, SFT is widely used to endow models with task-specific capabilities that cannot be effectively learned from unlabeled corpora alone. Task-centric SFT has been applied to models such as PolySea<sup>[<xref ref-type="bibr" rid="B45">45</xref>]</sup> and SteelBERT<sup>[<xref ref-type="bibr" rid="B46">46</xref>]</sup>, enabling them to perform domain-specific tasks. However, these models risk lacking generalization capabilities beyond the scope of predefined tasks.</p>
          <p>Reinforcement learning<break/>Reinforcement learning (RL) has become a prevailing approach for aligning LLMs with specific preferences or human feedback. It also provides a more dynamic paradigm for the decision making and iterative reasoning requirements of agentic materials workflows. In this framework, reward signals, including human preferences, rule-based evaluators, or self-consistency critics, are constructed to evaluate LLM outputs and provide feedback for policy optimization. By rewarding coherent and actionable reasoning, RL enhances the ability of LLMs to meet the requirements of higher autonomy in agents operating in closed-loop computational or experimental environments.</p>
        </sec>
        <sec id="sec2-3-2">
          <title>Sub-domain specialized models</title>
          <p>
            <xref ref-type="table" rid="t1">Table 1</xref> presents representative models created within various materials science subfields. These models demonstrate practical implementations of the described methodological paradigms and highlight methodological diversity across the discipline. They include tailored models that incorporate priors for various material classes, including molecules<sup>[<xref ref-type="bibr" rid="B47">47</xref>-<xref ref-type="bibr" rid="B49">49</xref>]</sup>, polymers<sup>[<xref ref-type="bibr" rid="B45">45</xref>,<xref ref-type="bibr" rid="B50">50</xref>,<xref ref-type="bibr" rid="B51">51</xref>]</sup>, alloys<sup>[<xref ref-type="bibr" rid="B46">46</xref>,<xref ref-type="bibr" rid="B52">52</xref>]</sup>, perovskites<sup>[<xref ref-type="bibr" rid="B53">53</xref>]</sup>, batteries<sup>[<xref ref-type="bibr" rid="B54">54</xref>]</sup>, optical materials<sup>[<xref ref-type="bibr" rid="B55">55</xref>]</sup>, and catalysts<sup>[<xref ref-type="bibr" rid="B56">56</xref>]</sup>. Unlike general-purpose LLMs designed to capture broad conceptual patterns, these models utilize domain-specific CPT or fine-tuning to capture chemical, structural, and processing features unique to each material category. Consequently, sub-domain LLMs provide more robust results compared to generalist models in downstream applications.</p>
          <table-wrap id="t1">
            <label>Table 1</label>
            <caption>
              <p>Representative sub-domain specialized LLMs in MSE</p>
            </caption>
            <table frame="hsides" rules="groups">
              <thead>
                <tr>
                  <td style="border-bottom:1;">
                    <bold>Model</bold>
                  </td>
                  <td style="border-bottom:1;">
                    <bold>Sub-domain</bold>
                  </td>
                  <td style="border-bottom:1;">
                    <bold>Approach</bold>
                  </td>
                  <td style="border-bottom:1;">
                    <bold>Data scale</bold>
                  </td>
                  <td style="border-bottom:1;">
                    <bold>Modalities</bold>
                  </td>
                  <td style="border-bottom:1;">
                    <bold>Agentic usage</bold>
                  </td>
                </tr>
              </thead>
              <tbody>
                <tr>
                  <td>MatSciBERT<sup>[<xref ref-type="bibr" rid="B40">40</xref>]</sup></td>
                  <td>General</td>
                  <td>CPT</td>
                  <td>3.45B words</td>
                  <td>Text</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>MaterialBERT<sup>[<xref ref-type="bibr" rid="B6">6</xref>]</sup></td>
                  <td>General</td>
                  <td>CPT</td>
                  <td>8.4M entries</td>
                  <td>Text</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>MatterChat<sup>[<xref ref-type="bibr" rid="B57">57</xref>]</sup></td>
                  <td>General</td>
                  <td>Pretrain + SFT</td>
                  <td>142K samples</td>
                  <td>Text + molecular</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>LLaMat-Chat<sup>[<xref ref-type="bibr" rid="B33">33</xref>]</sup></td>
                  <td>General</td>
                  <td>CPT + SFT</td>
                  <td>30B tokens</td>
                  <td>Text</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>LLaMat-CIF<sup>[<xref ref-type="bibr" rid="B33">33</xref>]</sup></td>
                  <td>Crystal</td>
                  <td>CPT + SFT</td>
                  <td>7M structures</td>
                  <td>Text + CIF</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>CrystalLLM<sup>[<xref ref-type="bibr" rid="B58">58</xref>]</sup></td>
                  <td>Crystal</td>
                  <td>Pretrain</td>
                  <td>2.3M structures</td>
                  <td>Text + CIF</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>Mol-LLM<sup>[<xref ref-type="bibr" rid="B47">47</xref>]</sup></td>
                  <td>Molecules</td>
                  <td>SFT + RL</td>
                  <td>3.3M samples</td>
                  <td>Text + molecular</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>BindGPT<sup>[<xref ref-type="bibr" rid="B48">48</xref>]</sup></td>
                  <td>Molecules</td>
                  <td>Pretrain + SFT + RL</td>
                  <td>200M samples</td>
                  <td>Text + molecular</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>ChemMLLM<sup>[<xref ref-type="bibr" rid="B49">49</xref>]</sup></td>
                  <td>Molecules</td>
                  <td>SFT</td>
                  <td>400K entries</td>
                  <td>Text + molecular + image</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>BatGPT-Chem<sup>[<xref ref-type="bibr" rid="B59">59</xref>]</sup></td>
                  <td>Molecules</td>
                  <td>SFT</td>
                  <td>112K entries</td>
                  <td>Text + molecular</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>PolySea<sup>[<xref ref-type="bibr" rid="B45">45</xref>]</sup></td>
                  <td>Polymers</td>
                  <td>SFT</td>
                  <td>230K samples</td>
                  <td>Text + molecular</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>PolyBERT<sup>[<xref ref-type="bibr" rid="B50">50</xref>]</sup></td>
                  <td>Polymers</td>
                  <td>Pretrain + SFT</td>
                  <td>100M samples</td>
                  <td>Molecular</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>TransPolymer<sup>[<xref ref-type="bibr" rid="B51">51</xref>]</sup></td>
                  <td>Polymers</td>
                  <td>Pretrain + SFT</td>
                  <td>5M samples</td>
                  <td>Text + molecular</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>SteelBERT<sup>[<xref ref-type="bibr" rid="B46">46</xref>]</sup></td>
                  <td>Alloys</td>
                  <td>Pretrain + SFT</td>
                  <td>0.96B words</td>
                  <td>Text + tables</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>AlloyBERT<sup>[<xref ref-type="bibr" rid="B52">52</xref>]</sup></td>
                  <td>Alloys</td>
                  <td>SFT</td>
                  <td>1K samples</td>
                  <td>Text</td>
                  <td>Agentic tools</td>
                </tr>
                <tr>
                  <td>Perovskite-LLM<sup>[<xref ref-type="bibr" rid="B53">53</xref>]</sup></td>
                  <td>Perovskites</td>
                  <td>SFT</td>
                  <td>4.4M tokens</td>
                  <td>Text</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>BatteryBERT<sup>[<xref ref-type="bibr" rid="B54">54</xref>]</sup></td>
                  <td>Battery materials</td>
                  <td>Pretrain + CPT + SFT</td>
                  <td>3.3B tokens</td>
                  <td>Text</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>OpticalBERT<sup>[<xref ref-type="bibr" rid="B55">55</xref>]</sup></td>
                  <td>Optical materials</td>
                  <td>Pretrain + CPT + SFT</td>
                  <td>2.92B tokens</td>
                  <td>Text + tables</td>
                  <td>Core models</td>
                </tr>
                <tr>
                  <td>CatGPT<sup>[<xref ref-type="bibr" rid="B56">56</xref>]</sup></td>
                  <td>Catalysts</td>
                  <td>Pretrain + SFT</td>
                  <td>2M structures</td>
                  <td>Text-encoded structures</td>
                  <td>Agentic tools</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn>
                <p>LLMs: Large language models; MSE: materials science and engineering; CPT: continued pretraining; SFT: supervised fine-tuning; RL: reinforcement learning; Core models: models that may participate in reasoning and decision making within agentic systems; Agentic tools: models that may be invoked to execute specific tasks.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <p>In agentic systems, these domain-specific priors make such models appropriate for incorporation into materials science workflows. Depending on their role, they may function as cognitive components for decision making, planning, and reasoning, or as execution tools such as property predictors, structure analyzers, or simulation surrogates. Accordingly, we categorize the models in <xref ref-type="table" rid="t1">Table 1</xref> into “Core Models” and “Agentic Tools” to better reflect their functional roles within agentic systems.</p>
        </sec>
      </sec>
      <sec id="sec2-4">
        <title>Agentic infrastructures for materials science</title>
        <p>Beyond domain-specific models, recent progress in agentic MSE also depends on a broader infrastructure layer that supports information access, state tracking, planning, execution, and evaluation. Most of these open-source resources are not agentic in themselves. Instead, as shown in <xref ref-type="table" rid="t2">Table 2</xref>, they provide callable components that LLM-based agents can invoke and coordinate to build scientific workflows. Importantly, these infrastructures do more than support engineering integration; they also instantiate the core mechanisms that make agentic scientific workflows possible, including retrieval and grounding, memory persistence, task decomposition, tool routing, execution control, and feedback-driven correction. In this sense, they externalize recurring steps in materials research into reusable computational modules and define much of what can be agentized with current infrastructure. <xref ref-type="table" rid="t2">Table 2</xref> summarizes representative resources together with the scientific functions they support across knowledge, planning, execution, and evaluation.</p>
        <table-wrap id="t2">
          <label>Table 2</label>
          <caption>
            <p>Representative resources supporting core functional components of agentic MSE</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Resource category</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Representative tools or platforms</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Scientific role in materials research</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td rowspan="7">Knowledge/memory</td>
                <td>Materials Project<sup>[<xref ref-type="bibr" rid="B60">60</xref>]</sup>, Materials Cloud<sup>[<xref ref-type="bibr" rid="B61">61</xref>]</sup>, NOMAD<sup>[<xref ref-type="bibr" rid="B62">62</xref>]</sup>, AFLOW<sup>[<xref ref-type="bibr" rid="B63">63</xref>]</sup></td>
                <td>Knowledge retrieval &amp; structured scientific data hub</td>
              </tr>
              <tr>
                <td>MatKG<sup>[<xref ref-type="bibr" rid="B64">64</xref>]</sup>, MGED-KG<sup>[<xref ref-type="bibr" rid="B65">65</xref>]</sup>, MeKG<sup>[<xref ref-type="bibr" rid="B66">66</xref>]</sup></td>
                <td>Materials KGs &amp; Entity–relation storage</td>
              </tr>
              <tr>
                <td>MongoDB<sup>[<xref ref-type="bibr" rid="B67">67</xref>]</sup>, PostgreSQL<sup>[<xref ref-type="bibr" rid="B68">68</xref>]</sup></td>
                <td>Data storage</td>
              </tr>
              <tr>
                <td>EMMO<sup>[<xref ref-type="bibr" rid="B69">69</xref>]</sup>, ONTORULE<sup>[<xref ref-type="bibr" rid="B70">70</xref>]</sup>, SLACKS<sup>[<xref ref-type="bibr" rid="B71">71</xref>]</sup></td>
                <td>Domain ontologies</td>
              </tr>
              <tr>
                <td>FAISS<sup>[<xref ref-type="bibr" rid="B72">72</xref>]</sup>, Milvus<sup>[<xref ref-type="bibr" rid="B73">73</xref>]</sup>, Qdrant<sup>[<xref ref-type="bibr" rid="B74">74</xref>]</sup>, Weaviate<sup>[<xref ref-type="bibr" rid="B75">75</xref>]</sup></td>
                <td>Semantic storage &amp; vector similarity search</td>
              </tr>
              <tr>
                <td>Neo4j<sup>[<xref ref-type="bibr" rid="B76">76</xref>]</sup>, RDFLib<sup>[<xref ref-type="bibr" rid="B77">77</xref>]</sup>, Letta (MemGPT)<sup>[<xref ref-type="bibr" rid="B78">78</xref>]</sup></td>
                <td>Graph-based knowledge storage</td>
              </tr>
              <tr>
                <td>LlamaIndex<sup>[<xref ref-type="bibr" rid="B79">79</xref>]</sup>, Haystack<sup>[<xref ref-type="bibr" rid="B80">80</xref>]</sup>, SerpAPI<sup>[<xref ref-type="bibr" rid="B81">81</xref>]</sup></td>
                <td>Retrieval-augmented document search</td>
              </tr>
              <tr>
                <td rowspan="2">Decision/planning</td>
                <td>LangChain<sup>[<xref ref-type="bibr" rid="B82">82</xref>]</sup>, LangGraph<sup>[<xref ref-type="bibr" rid="B83">83</xref>]</sup>, AutoGen<sup>[<xref ref-type="bibr" rid="B84">84</xref>]</sup>, CrewAI<sup>[<xref ref-type="bibr" rid="B85">85</xref>]</sup></td>
                <td>Agentic orchestration &amp; logic workflow construction</td>
              </tr>
              <tr>
                <td>ReAct<sup>[<xref ref-type="bibr" rid="B86">86</xref>]</sup>, Reflexion<sup>[<xref ref-type="bibr" rid="B87">87</xref>]</sup></td>
                <td>Iterative reasoning and self-reflection</td>
              </tr>
              <tr>
                <td rowspan="5">Execution/action</td>
                <td>FireWorks<sup>[<xref ref-type="bibr" rid="B88">88</xref>]</sup>, AiiDA<sup>[<xref ref-type="bibr" rid="B89">89</xref>]</sup>, Simmate<sup>[<xref ref-type="bibr" rid="B90">90</xref>]</sup>, Colmena<sup>[<xref ref-type="bibr" rid="B91">91</xref>]</sup>, pymatgen<sup>[<xref ref-type="bibr" rid="B92">92</xref>]</sup></td>
                <td>Simulation workflow engines</td>
              </tr>
              <tr>
                <td>VASP<sup>[<xref ref-type="bibr" rid="B93">93</xref>]</sup>, Quantum ESPRESSO<sup>[<xref ref-type="bibr" rid="B94">94</xref>]</sup>, ABINIT<sup>[<xref ref-type="bibr" rid="B95">95</xref>]</sup>, GPAW<sup>[<xref ref-type="bibr" rid="B96">96</xref>]</sup></td>
                <td>Simulation engines &amp; Python interfaces for DFT</td>
              </tr>
              <tr>
                <td>LAMMPS<sup>[<xref ref-type="bibr" rid="B97">97</xref>]</sup>, GROMACS<sup>[<xref ref-type="bibr" rid="B98">98</xref>]</sup>, OpenMM<sup>[<xref ref-type="bibr" rid="B99">99</xref>]</sup></td>
                <td>MD &amp; interatomic models</td>
              </tr>
              <tr>
                <td>PyVISA<sup>[<xref ref-type="bibr" rid="B100">100</xref>]</sup>, RoboRXN<sup>[<xref ref-type="bibr" rid="B101">101</xref>]</sup>, PyLabRobot<sup>[<xref ref-type="bibr" rid="B102">102</xref>]</sup></td>
                <td>Automated experiment execution</td>
              </tr>
              <tr>
                <td>Pydantic-AI<sup>[<xref ref-type="bibr" rid="B103">103</xref>]</sup></td>
                <td>Workflow scheduling and automation</td>
              </tr>
              <tr>
                <td rowspan="2">Evaluation/feedback</td>
                <td>MatSciBench<sup>[<xref ref-type="bibr" rid="B104">104</xref>]</sup>, MSQA<sup>[<xref ref-type="bibr" rid="B105">105</xref>]</sup>, MatTools<sup>[<xref ref-type="bibr" rid="B106">106</xref>]</sup>, ALDBench<sup>[<xref ref-type="bibr" rid="B107">107</xref>]</sup>, MatBench Discovery<sup>[<xref ref-type="bibr" rid="B108">108</xref>]</sup>, RxnBench<sup>[<xref ref-type="bibr" rid="B109">109</xref>]</sup>, SDE<sup>[<xref ref-type="bibr" rid="B110">110</xref>]</sup>, SFE<sup>[<xref ref-type="bibr" rid="B111">111</xref>]</sup></td>
                <td>Domain benchmarks</td>
              </tr>
              <tr>
                <td>LangSmith<sup>[<xref ref-type="bibr" rid="B112">112</xref>]</sup>, OpenAI Evals<sup>[<xref ref-type="bibr" rid="B113">113</xref>]</sup>, Ragas<sup>[<xref ref-type="bibr" rid="B114">114</xref>]</sup></td>
                <td>General evaluation frameworks and platforms</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>MSE: Materials science and engineering; KGs: knowledge graphs; DFT: density functional theory; MD: molecular dynamics; AI: artificial intelligence.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Knowledge and memory<break/>Materials science research depends heavily on the scientific literature and diverse data resources including materials databases, simulation outputs, and experimental records. Researchers often need to review extensive papers, database entries, and experimental records to summarize existing findings and identify material systems and key parameters<sup>[<xref ref-type="bibr" rid="B115">115</xref>]</sup>. Agent-based systems require not only access to information, but also mechanisms for grounding their decisions in structured scientific evidence. In practice, this ability is enabled by a combination of retrieval-augmented generation (RAG), semantic similarity search, graph-based relation storage, and memory modules that preserve intermediate findings across workflow steps. For example, agents may retrieve structures, properties, phase stability data, or prior computational results from resources such as the Materials Project<sup>[<xref ref-type="bibr" rid="B60">60</xref>]</sup> and Materials Cloud<sup>[<xref ref-type="bibr" rid="B61">61</xref>]</sup>, and then store relevant constraints or candidate information for later reasoning<sup>[<xref ref-type="bibr" rid="B62">62</xref>,<xref ref-type="bibr" rid="B63">63</xref>]</sup>. More broadly, vector databases<sup>[<xref ref-type="bibr" rid="B72">72</xref>-<xref ref-type="bibr" rid="B75">75</xref>]</sup>, knowledge graphs (KGs)<sup>[<xref ref-type="bibr" rid="B64">64</xref>-<xref ref-type="bibr" rid="B66">66</xref>]</sup>, ontology systems<sup>[<xref ref-type="bibr" rid="B69">69</xref>-<xref ref-type="bibr" rid="B71">71</xref>]</sup>, and general-purpose data storage solutions such as MongoDB<sup>[<xref ref-type="bibr" rid="B67">67</xref>]</sup> and PostgreSQL<sup>[<xref ref-type="bibr" rid="B68">68</xref>]</sup> help connect scientific entities, conditions, and relationships across different sources. 
These mechanisms are important because materials workflows often require agents to accumulate evidence across multiple documents and data modalities rather than relying on a single query or static context. Other commonly used tools<sup>[<xref ref-type="bibr" rid="B76">76</xref>-<xref ref-type="bibr" rid="B81">81</xref>]</sup> are summarized in <xref ref-type="table" rid="t2">Table 2</xref>.</p>
        <p>Decision and planning<break/>In agent-driven materials research, a key challenge is to turn a broad scientific goal into a clear sequence of steps, and to keep the workflow consistent as new results appear. Agents must translate open-ended goals, such as identifying stable candidate materials or proposing synthesis conditions, into tractable substeps; maintain workflow state as new evidence appears; and revise plans when intermediate results are invalid, incomplete, or scientifically uninformative. These capabilities are commonly supported by mechanisms such as task decomposition, graph-structured workflow control, tool routing, reflection, and role-based multi-agent coordination. Frameworks such as LangChain<sup>[<xref ref-type="bibr" rid="B82">82</xref>]</sup> and LangGraph<sup>[<xref ref-type="bibr" rid="B83">83</xref>]</sup> support this process by providing building blocks to design multi-step agent workflows, connect external tools (such as databases, search engines, and code execution environments), and manage information flow between steps. They also help coordinate multiple roles or agents, enabling tasks such as literature search, data analysis, and result checking to be organized into a single pipeline. Beyond orchestration frameworks, the underlying reasoning algorithms are equally important. ReAct<sup>[<xref ref-type="bibr" rid="B86">86</xref>]</sup> enables agents to interleave reasoning and tool use across workflow steps, allowing them to iteratively refine hypotheses based on external evidence and execution feedback. Reflexion<sup>[<xref ref-type="bibr" rid="B87">87</xref>]</sup> further adds a self-reflection step, in which agents use feedback from earlier failures to improve subsequent decisions. This is particularly useful in multi-step materials workflows, where early errors in candidate selection, parameter setting, or intermediate result interpretation may affect later stages. 
<xref ref-type="table" rid="t2">Table 2</xref> provides additional tools and frameworks<sup>[<xref ref-type="bibr" rid="B84">84</xref>,<xref ref-type="bibr" rid="B85">85</xref>]</sup>.</p>
        <p>Execution and actions<break/>After planning, agents also need reliable mechanisms to execute actions and obtain scientifically meaningful feedback from the environment. In materials workflows, execution is not limited to calling generic APIs; it often requires parameterizing simulations, launching structured workflows, managing intermediate artifacts, and coupling language-level reasoning with numerical or experimental engines. Workflow managers and execution interfaces allow agents to organize computational jobs, pass structured inputs, monitor execution status, and collect outputs for downstream reasoning. They can also interface with common simulation codes<sup>[<xref ref-type="bibr" rid="B88">88</xref>-<xref ref-type="bibr" rid="B92">92</xref>]</sup>, <italic>ab initio</italic> calculation packages<sup>[<xref ref-type="bibr" rid="B93">93</xref>-<xref ref-type="bibr" rid="B96">96</xref>]</sup>, molecular dynamics (MD) tools<sup>[<xref ref-type="bibr" rid="B97">97</xref>-<xref ref-type="bibr" rid="B99">99</xref>]</sup>, and automated experiment execution and workflow tools<sup>[<xref ref-type="bibr" rid="B100">100</xref>-<xref ref-type="bibr" rid="B103">103</xref>]</sup>.</p>
        <p>Evaluation and benchmarking<break/>Existing evaluation practices for scientific LLMs and agents span a spectrum from static, capability-oriented benchmarks (e.g., domain QA<sup>[<xref ref-type="bibr" rid="B104">104</xref>-<xref ref-type="bibr" rid="B106">106</xref>]</sup>, materials synthesis tasks<sup>[<xref ref-type="bibr" rid="B107">107</xref>]</sup>) to workflow-level assessments that test multi-step planning and tool use, and finally to realistic multimodal settings that require cross-document reasoning. Recently, several new benchmarks have further expanded this landscape, including scenario- and project-grounded evaluations for discovery workflows<sup>[<xref ref-type="bibr" rid="B110">110</xref>]</sup>, hierarchical multimodal evaluations from localized perception to full-document synthesis<sup>[<xref ref-type="bibr" rid="B109">109</xref>,<xref ref-type="bibr" rid="B110">110</xref>]</sup>, cognition-oriented multimodal evaluations that decompose scientific capability into perception, attribute understanding, and comparative reasoning across raw scientific data and multiple disciplines<sup>[<xref ref-type="bibr" rid="B111">111</xref>]</sup>, and prospective, discovery-oriented evaluations for stability screening with task-relevant decision metrics<sup>[<xref ref-type="bibr" rid="B108">108</xref>]</sup>. These provide transferable principles for next-generation benchmarking in agentic MSE. General evaluation and observability frameworks are also increasingly used to assess LLM and agent systems beyond domain-specific benchmarks. LangSmith<sup>[<xref ref-type="bibr" rid="B112">112</xref>]</sup> provides tracing, observability, and experiment-level evaluation for LLM applications and AI agents. OpenAI Evals<sup>[<xref ref-type="bibr" rid="B113">113</xref>]</sup> offers a general framework for testing whether model outputs satisfy task-specific criteria, and is widely used for systematic evaluation and model comparison. 
Ragas<sup>[<xref ref-type="bibr" rid="B114">114</xref>]</sup> complements these platforms with metric-driven evaluation workflows, particularly for RAG and agentic applications, including reusable metrics and evaluation pipelines.</p>
      </sec>
    </sec>
    <sec id="sec3">
      <title>THE HIERARCHY OF AUTONOMY IN MATERIALS SCIENCE AGENTS</title>
      <p>As discussed in previous sections, we focus on five key tasks in MSE research: literature retrieval and hypothesis generation, property prediction and design, simulation and multiscale modeling, automated experimental synthesis, and characterization and data analysis. These tasks are selected to span the full spectrum of materials research, from abstract knowledge reasoning to concrete physical realization. Collectively, they capture how information flows through the research and development pipeline, where hypotheses are formed from literature, tested through simulations, verified in experiments, and interpreted through characterization and data analysis.</p>
      <p>Each task offers a distinct perspective for examining the advancement of agentic MSE. Crucially, the progression of autonomy is not uniform across these domains. Within the same task, systems can operate at different levels of autonomy - from simple assistants that conceptually interact with humans (Level 1) to agents capable of multi-step planning or feedback-guided execution (Levels 3-4). For example, in experimental synthesis, some systems still act as assistants that suggest procedures or parameters<sup>[<xref ref-type="bibr" rid="B116">116</xref>]</sup>, while others already integrate planning with tool use and long-running execution, approaching higher autonomy through closed-loop operation<sup>[<xref ref-type="bibr" rid="B117">117</xref>]</sup>. Notably, as agents reach higher autonomy levels, the boundaries between tasks often become less clear. More advanced systems may span multiple tasks simultaneously and shift from a single-task view to a more system-level view. We discuss this in detail in the following sections.</p>
      <p>This framework facilitates a dual analysis: horizontally across distinct tasks and vertically across levels of autonomy, revealing both the disparities and synergies in current progress. Tasks that are cognitively intensive yet computationally tractable - such as text mining or property prediction - have achieved greater maturity, whereas experiment-centric tasks continue to face bottlenecks regarding robotics integration and safety control. By intersecting these dimensions, we establish a task-level view of autonomy: for each domain, we define its role, the current state of agentic systems, and the highest level of autonomy practically demonstrated to date. The following subsections discuss these tasks in detail.</p>
      <sec id="sec3-1">
        <title>IE and hypothesis generation</title>
        <p>MSE possesses a vast corpus of scientific literature, yet turning this unstructured text into structured datasets and actionable knowledge remains a significant challenge. IE tools are crucial for mining information on materials, properties, synthesis conditions, and performance metrics to build databases that accelerate materials design and understanding<sup>[<xref ref-type="bibr" rid="B118">118</xref>,<xref ref-type="bibr" rid="B119">119</xref>]</sup>. Recent advances in NLP, ranging from domain-tuned language models<sup>[<xref ref-type="bibr" rid="B40">40</xref>]</sup> to multi-agent systems (MAS)<sup>[<xref ref-type="bibr" rid="B120">120</xref>,<xref ref-type="bibr" rid="B121">121</xref>]</sup>, are advancing IE beyond simple data gathering toward active hypothesis generation for new materials and experiments<sup>[<xref ref-type="bibr" rid="B30">30</xref>]</sup>. In this section, we examine the evolution of these capabilities, classifying systems by their level of autonomy in transforming raw text into novel scientific directions. Representative systems for this task are summarized in <xref ref-type="table" rid="t3">Table 3</xref>, including a brief comparison of their autonomy levels, multi-agent settings, closed-loop capabilities, equipment integration, and open-source availability. Similar summary tables are provided for each task in the following sections; therefore, this note is not repeated thereafter.</p>
        <table-wrap id="t3">
          <label>Table 3</label>
          <caption>
            <p>Representative systems for IE and hypothesis generation</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Methods</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Year</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Autonomy level</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Multi-agent</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Closed-loop</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Equipment integration</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Open source</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Agentic system</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>ChemicalTagger<sup>[<xref ref-type="bibr" rid="B122">122</xref>]</sup></td>
                <td>2011</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>ChemDataExtractor<sup>[<xref ref-type="bibr" rid="B123">123</xref>]</sup></td>
                <td>2016</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>△</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Mat2Vec<sup>[<xref ref-type="bibr" rid="B125">125</xref>]</sup></td>
                <td>2019</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Materials NER<sup>[<xref ref-type="bibr" rid="B126">126</xref>]</sup></td>
                <td>2019</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>△</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Dunn <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B130">130</xref>]</sup></td>
                <td>2022</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Yan <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B119">119</xref>]</sup></td>
                <td>2022</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Action_extractor<sup>[<xref ref-type="bibr" rid="B127">127</xref>]</sup></td>
                <td>2023</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>SFBC<sup>[<xref ref-type="bibr" rid="B128">128</xref>]</sup></td>
                <td>2023</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MatKG<sup>[<xref ref-type="bibr" rid="B64">64</xref>]</sup></td>
                <td>2024</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MGED-KG<sup>[<xref ref-type="bibr" rid="B65">65</xref>]</sup></td>
                <td>2024</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MOF-KG<sup>[<xref ref-type="bibr" rid="B129">129</xref>]</sup></td>
                <td>2024</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Silva <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B132">132</xref>]</sup></td>
                <td>2024</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MaTableGPT<sup>[<xref ref-type="bibr" rid="B131">131</xref>]</sup></td>
                <td>2025</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>HoneyBee<sup>[<xref ref-type="bibr" rid="B133">133</xref>]</sup></td>
                <td>2023</td>
                <td>L2</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>HoneyComb<sup>[<xref ref-type="bibr" rid="B14">14</xref>]</sup></td>
                <td>2024</td>
                <td>L2</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
              </tr>
              <tr>
                <td>Eunomia<sup>[<xref ref-type="bibr" rid="B12">12</xref>]</sup></td>
                <td>2024</td>
                <td>L2</td>
                <td>×</td>
                <td>△</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>SciMON<sup>[<xref ref-type="bibr" rid="B134">134</xref>]</sup></td>
                <td>2024</td>
                <td>L3</td>
                <td>√</td>
                <td>△</td>
                <td>×</td>
                <td>√</td>
                <td>△</td>
              </tr>
              <tr>
                <td>Liu <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B120">120</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>√</td>
                <td>×</td>
                <td>×</td>
                <td>△</td>
              </tr>
              <tr>
                <td>SciAgents<sup>[<xref ref-type="bibr" rid="B121">121</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>√</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>AccelMat<sup>[<xref ref-type="bibr" rid="B30">30</xref>]</sup></td>
                <td>2025</td>
                <td>L4</td>
                <td>√</td>
                <td>√</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>PriM<sup>[<xref ref-type="bibr" rid="B135">135</xref>]</sup></td>
                <td>2025</td>
                <td>L4</td>
                <td>√</td>
                <td>√</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Notes: √ = present; × = absent; △ = partial or simulated integration. IE: Information extraction; MatKG: Knowledge Graph of Materials Science; MGED-KG: Materials Genome Engineering Database Knowledge Graph; MOF-KG: Metal-Organic Framework Knowledge Graph.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>
          <bold>Level 1.</bold> Research at Level 1 focuses on automating specific, labor-intensive tasks within the scientific workflow, particularly IE and the construction of structured knowledge bases from unstructured literature. These systems act as intelligent assistants, parsing vast amounts of text to provide structured data that humans or downstream models can utilize. Early foundational efforts relied on rule-based systems and statistical pipelines. Tools such as ChemicalTagger<sup>[<xref ref-type="bibr" rid="B122">122</xref>]</sup> employ grammar-based parsing to identify chemical action phrases, while ChemDataExtractor<sup>[<xref ref-type="bibr" rid="B123">123</xref>,<xref ref-type="bibr" rid="B124">124</xref>]</sup> combines part-of-speech tagging with rule-based logic to resolve interdependencies between text and tables for precise entity extraction. Subsequent approaches integrated deep learning to scale these capabilities. Mat2Vec<sup>[<xref ref-type="bibr" rid="B125">125</xref>]</sup> demonstrates that unsupervised word embeddings can capture latent chemical knowledge to predict future materials, a concept expanded by Materials NER<sup>[<xref ref-type="bibr" rid="B126">126</xref>]</sup> to mine inorganic materials from millions of abstracts. To address data scarcity in specialized domains such as superalloys, semi-supervised frameworks<sup>[<xref ref-type="bibr" rid="B119">119</xref>]</sup> including Action_extractor<sup>[<xref ref-type="bibr" rid="B127">127</xref>]</sup> have been developed, with SFBC<sup>[<xref ref-type="bibr" rid="B128">128</xref>]</sup> further refining accuracy by combining dynamic and static embeddings.</p>
        <p>These extraction efforts evolve toward the construction of semantic KGs and the integration of LLMs. Systems such as MatKG (Knowledge Graph of Materials Science)<sup>[<xref ref-type="bibr" rid="B64">64</xref>]</sup> and MGED-KG (Materials Genome Engineering Database Knowledge Graph)<sup>[<xref ref-type="bibr" rid="B65">65</xref>]</sup> integrate entities into semantically linked networks, while MOF-KG (Metal-Organic Framework Knowledge Graph)<sup>[<xref ref-type="bibr" rid="B129">129</xref>]</sup> adds an LLM-powered interface for natural language querying. Concurrently, LLMs revolutionize extraction flexibility: Dunn <italic>et al.</italic> utilize fine-tuned models for joint entity-relation extraction<sup>[<xref ref-type="bibr" rid="B130">130</xref>]</sup>, while MaTableGPT<sup>[<xref ref-type="bibr" rid="B131">131</xref>]</sup> and Silva <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B132">132</xref>]</sup> leverage advanced serialization strategies to extract complex synthesis protocols and tabular data with high precision.</p>
        <p>
          <bold>Level 2.</bold> Level 2 agents distinguish themselves by augmenting textual analysis with external tools and domain-specific knowledge, enabling robust, context-aware data curation. Unlike Level 1 systems that rely solely on pattern recognition within text, these agents can actively query databases, invoke APIs, or utilize specialized modules to validate and refine extracted information, thereby transforming static extraction into a dynamic and verified process. HoneyBee<sup>[<xref ref-type="bibr" rid="B133">133</xref>]</sup>, an LLM progressively instruction-tuned for MSE, exemplifies this capability by generating trustworthy instruction data via MatSci-Instruct to execute domain-specific tasks with higher fidelity than general-purpose models. Building on this, HoneyComb<sup>[<xref ref-type="bibr" rid="B14">14</xref>]</sup> integrates a high-quality knowledge base (MatSciKB) with a sophisticated tool hub (ToolHub). It employs an inductive tool construction method to generate and refine API tools, allowing the agent to adaptively select and utilize appropriate tools for complex queries, thereby bridging the gap between static knowledge and dynamic tool execution. Furthermore, Eunomia<sup>[<xref ref-type="bibr" rid="B12">12</xref>]</sup> represents an agent-based framework where LLMs autonomously create structured datasets from literature and derive design guidelines. These systems showcase Level 2 autonomy by orchestrating the flow from raw text to actionable insights through tool use, though they remain single-agent planners.</p>
        <p>
          <bold>Level 3.</bold> Level 3 agents transcend the execution of predefined workflows, exhibiting advanced capabilities in reasoning, planning, and generating novel scientific hypotheses. Operating as collaborative planners, they often employ multi-agent architectures to explore vast knowledge spaces. Liu <italic>et al.</italic> demonstrated that LLMs coupled with prompt engineering can generate valid materials design hypotheses that extend beyond the explicit knowledge of human designers<sup>[<xref ref-type="bibr" rid="B120">120</xref>]</sup>. By integrating diverse scientific principles, the model successfully proposed novel high-entropy alloys and halide solid electrolytes, which were subsequently validated in recent literature. Advancing the multi-agent paradigm, SciAgents<sup>[<xref ref-type="bibr" rid="B121">121</xref>]</sup> automates discovery through intelligent graph reasoning. It employs a suite of specialized agents (e.g., Ontologist, Scientist, Critic) that interact with an ontological KG to reveal hidden interdisciplinary relationships, generating hypotheses with precision that surpasses traditional methods. Furthermore, SciMON<sup>[<xref ref-type="bibr" rid="B134">134</xref>]</sup> ensures the novelty of generated hypotheses by retrieving “inspirations” from past literature and iteratively comparing generated ideas against prior work, addressing the common issue of low technical novelty in standard LLM outputs.</p>
        <p>
          <bold>Exploration of Level 4.</bold> Research at Level 4 bridges the gap between digital hypothesis generation and physical execution, focusing on actionable experimental planning under real-world constraints. These agents are characterized by their ability to perform constraint-aware planning and integrate quantitative data to refine feasibility. Several recent studies have begun to explore the transition toward Level 4 autonomy. AccelMat<sup>[<xref ref-type="bibr" rid="B30">30</xref>]</sup> introduced a goal-driven and constraint-guided LLM agent framework designed to generate viable hypotheses for materials discovery under specific real-world constraints. Utilizing a curated novel dataset from recent publications, which includes explicit design goals and constraints (e.g., cost, equipment availability), the framework demonstrates effectiveness in planning synthesis routes and experimental procedures that are not only scientifically plausible but also practically feasible. This work moves beyond abstract hypothesis generation to actionable experimental planning. PriM<sup>[<xref ref-type="bibr" rid="B135">135</xref>]</sup> takes a further step by not only generating principle-guided hypotheses through multi-agent collaboration but also validating them within a surrogate model-based virtual laboratory. Although the experimental loop remains digital, this approach moves beyond static planning toward automated hypothesis-validation workflows that approximate physical closed-loop execution.</p>
        <p>
          <bold>Vision for Level 5.</bold> While Level 4 agents demonstrate advanced planning and partial closed-loop capabilities, significant challenges remain in realizing fully autonomous discovery, positioning Level 5 primarily as a visionary goal. The primary barrier is the lack of continuous physical grounding. Current advanced agents operate predominantly within a digital hypothesis space and lack direct interfaces to control physical experiments or robotic platforms. Furthermore, while systems such as AccelMat<sup>[<xref ref-type="bibr" rid="B30">30</xref>]</sup> and PriM<sup>[<xref ref-type="bibr" rid="B135">135</xref>]</sup> incorporate principle-guided reasoning and simulated validation, they operate without an active learning loop that autonomously requests experiments to resolve uncertainties. A true Level 5 “AI Scientist” would operate as a peer to human researchers, capable of identifying gaps in current theory, formulating original hypotheses, and managing the entire lifecycle of validation without human intervention. Future research should focus on integrating these reasoning engines with automated laboratory hardware (e.g., self-driving labs<sup>[<xref ref-type="bibr" rid="B37">37</xref>,<xref ref-type="bibr" rid="B136">136</xref>]</sup>) to create a truly closed-loop system where hypotheses are continuously tested and refined against physical reality.</p>
      </sec>
      <sec id="sec3-2">
        <title>Property prediction and design</title>
        <p>Advances in AI-driven property prediction and materials design are transforming how researchers discover and optimize new materials. Accurately predicting material properties or inversely designing materials with desired characteristics is crucial for accelerating the development of technologies in energy, electronics, catalysis, and related fields<sup>[<xref ref-type="bibr" rid="B57">57</xref>]</sup>. Traditionally, property prediction relied on experimental measurements or physics-based simulations, while inverse design was often a laborious trial-and-error process. Today, LLM-based agents are emerging as powerful tools to address these challenges. This section examines approaches for forward prediction and inverse design, structured according to ascending levels of agent autonomy, as summarized in <xref ref-type="table" rid="t4">Table 4</xref>.</p>
        <table-wrap id="t4">
          <label>Table 4</label>
          <caption>
            <p>Representative systems for property prediction and design</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Methods</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Year</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Autonomy level</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Multi-agent</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Closed-loop</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Equipment integration</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Open source</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Agentic system</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>AlloyBERT<sup>[<xref ref-type="bibr" rid="B52">52</xref>]</sup></td>
                <td>2024</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>LLM-Prop<sup>[<xref ref-type="bibr" rid="B43">43</xref>]</sup></td>
                <td>2025</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MatterChat<sup>[<xref ref-type="bibr" rid="B57">57</xref>]</sup></td>
                <td>2025</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
              </tr>
              <tr>
                <td>LLM-Fusion<sup>[<xref ref-type="bibr" rid="B137">137</xref>]</sup></td>
                <td>2025</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
              </tr>
              <tr>
                <td>ChatGPT Material Explorer<sup>[<xref ref-type="bibr" rid="B138">138</xref>]</sup></td>
                <td>2025</td>
                <td>L2</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>△</td>
                <td>√</td>
              </tr>
              <tr>
                <td>Rep-CodeGen<sup>[<xref ref-type="bibr" rid="B155">155</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>√</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>SparksMatter<sup>[<xref ref-type="bibr" rid="B156">156</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>√</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>MARS<sup>[<xref ref-type="bibr" rid="B31">31</xref>]</sup></td>
                <td>2026</td>
                <td>L4</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Notes: √ = present; × = absent; △ = partial or simulated integration. LLM: Large language model.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>
          <bold>Level 1.</bold> At the foundational Level 1, agents function as assistive tools for information retrieval and analysis in property prediction and design. Early systems such as ChemDataExtractor<sup>[<xref ref-type="bibr" rid="B123">123</xref>]</sup> utilized rule-based methods to parse scientific texts. More recent approaches, such as LLM-Prop<sup>[<xref ref-type="bibr" rid="B43">43</xref>]</sup>, leverage natural language descriptions of crystals to predict properties, while AlloyBERT<sup>[<xref ref-type="bibr" rid="B52">52</xref>]</sup> predicts alloy properties from human-readable text. Advanced systems such as MatterChat<sup>[<xref ref-type="bibr" rid="B57">57</xref>]</sup> and LLM-Fusion<sup>[<xref ref-type="bibr" rid="B137">137</xref>]</sup> can integrate multimodal inputs (text, structure, fingerprints) to engage in complex dialogue and analysis. However, these systems remain passive, requiring users to direct all actions, and thus demonstrate Level 1 autonomy: they assist in property prediction and design tasks, but lack capabilities for autonomous planning, tool invocation, integration with experimental equipment, and closed-loop functionality.</p>
        <p>
          <bold>Level 2.</bold> At Level 2, agents acquire the ability to invoke external computational or simulation tools, evolving from passive assistants to active implementers. A representative example is ChatGPT Material Explorer<sup>[<xref ref-type="bibr" rid="B138">138</xref>]</sup>, which can autonomously search materials databases and execute GNN-based property predictors in response to natural language queries. This Level 2 paradigm relies on a robust toolbox of specialized computational models for property prediction and design:</p>
        <p>• Forward Prediction Tools: These tools span composition-input predictors such as CrabNet<sup>[<xref ref-type="bibr" rid="B139">139</xref>]</sup>, ElemNet<sup>[<xref ref-type="bibr" rid="B140">140</xref>]</sup>, and Roost<sup>[<xref ref-type="bibr" rid="B141">141</xref>]</sup>, structure-input models such as MoMa<sup>[<xref ref-type="bibr" rid="B142">142</xref>]</sup>, Crystalformer<sup>[<xref ref-type="bibr" rid="B143">143</xref>]</sup>, and other crystal-graph architectures<sup>[<xref ref-type="bibr" rid="B144">144</xref>-<xref ref-type="bibr" rid="B146">146</xref>]</sup>, and emerging text-input predictors capable of inferring properties directly from natural language descriptions of materials such as PolyBERT<sup>[<xref ref-type="bibr" rid="B50">50</xref>]</sup>. Together, these established models provide a unified computational substrate for agents to rapidly evaluate candidates from structure or composition to target properties.</p>
        <p>• Generative Design Tools: These tools include early generative models such as CrystalGAN<sup>[<xref ref-type="bibr" rid="B147">147</xref>]</sup> and MolGPT<sup>[<xref ref-type="bibr" rid="B148">148</xref>]</sup>, which demonstrated the feasibility of generative modeling for crystalline and molecular systems, respectively, as well as highly advanced goal-conditioned generators<sup>[<xref ref-type="bibr" rid="B149">149</xref>]</sup> such as PLaID++<sup>[<xref ref-type="bibr" rid="B150">150</xref>]</sup>, which uses preference optimization to generate stable crystals meeting specific criteria, and MatterGen<sup>[<xref ref-type="bibr" rid="B151">151</xref>]</sup>.</p>
        <p>• <italic>In-Silico</italic> Optimization Loops: The most advanced Level 2 workflows chain these tools into autonomous computational loops. For example, the deep RL agent by Pan <italic>et al.</italic> autonomously explores chemical space in simulation to discover compounds<sup>[<xref ref-type="bibr" rid="B152">152</xref>]</sup>. Similarly, the “deep dreaming” approach for metal-organic frameworks (MOFs)<sup>[<xref ref-type="bibr" rid="B153">153</xref>]</sup> integrates a generator and predictor into a self-contained <italic>in silico</italic> closed loop to iteratively optimize structures. Sequential optimization strategies such as Bayesian optimization<sup>[<xref ref-type="bibr" rid="B154">154</xref>]</sup>, when integrated with forward property predictors, offer an additional route to efficient <italic>in silico</italic> search by guiding exploration toward high-performing regions of vast design spaces.</p>
        <p>These tool-augmented agents can execute complex multi-step computational tasks. While systems such as the RL agent exhibit a form of <italic>in silico</italic> closed-loop behavior, they remain at Level 2, as they operate as single-agent systems without physical equipment integration.</p>
        <p>
          <bold>Level 3.</bold> Level 3 is characterized by autonomous orchestration, where multiple role-specialized agents collaborate as a planning team for property prediction and design. Rep-CodeGen<sup>[<xref ref-type="bibr" rid="B155">155</xref>]</sup> is a representative example: a team of LLM agents iteratively writes, tests, and refines Python code to generate new material representations, and this closed-loop collaboration can discover representation schemes that improve property prediction accuracy. This marks a clear shift from a single tool-using agent (Level 2) to multi-agent collaboration within longer workflow pipelines. Beyond code-centered pipelines, SparksMatter<sup>[<xref ref-type="bibr" rid="B156">156</xref>]</sup> further illustrates Level 3 behavior at the task level. When given a high-level goal such as “design a soft semiconductor material”, its planning agent can identify that the request implies multiple sub-tasks and organize the workflow accordingly. Moreover, during prediction, the agent not only outputs a numeric value but also provides chain-of-thought explanations of why a prediction is made and which factors drive the result, thereby improving interpretability for downstream design decisions. Overall, Level 3 systems can form closed loops within the computational domain, but they remain purely <italic>in silico</italic> without direct integration with laboratory hardware for physical experimentation.</p>
        <p>
          <bold>Exploration of Level 4 and Level 5.</bold> The latter stages, Level 4 and Level 5, require linking autonomous computational planning with physical experimentation, and eventually with scientific problem discovery and validation. A key step from Level 3 to Level 4 is moving beyond <italic>in silico</italic> optimization toward physical closed-loop control by integrating agents with robotic lab platforms such as A-Lab<sup>[<xref ref-type="bibr" rid="B18">18</xref>]</sup> or ChemOS 2.0<sup>[<xref ref-type="bibr" rid="B25">25</xref>]</sup>. In the property prediction and design setting, recent systems such as MARS<sup>[<xref ref-type="bibr" rid="B31">31</xref>]</sup> begin to explore this direction by combining knowledge-grounded reasoning (e.g., hybrid RAG over domain literature) with tool-based analysis and coordinated execution. This enables predictions and decisions to be updated using real experimental feedback rather than remaining purely digital. Looking toward Level 5, agents should be able to autonomously select appropriate design and prediction strategies and integrate them into full experiment–computation validation loops, so that inverse design goals can be solved end-to-end with minimal human input. Achieving this level will require robust integration across tools and instruments, reliable closed-loop lab control, and multi-step reasoning that remains stable under real-world uncertainty.</p>
      </sec>
      <sec id="sec3-3">
        <title>Simulation and multiscale modeling</title>
        <p>In MSE, simulation is a crucial tool for designing new materials, validating conceptual hypotheses, and understanding material behaviors. Typical material simulation workflows can be classified into quantum mechanical calculations, atomistic simulations, mesoscale simulations, and continuum simulations. Traditionally (Level 0), these workflows required extensive manual effort: researchers had to construct simulation models manually, define assumptions and boundary conditions, select and calibrate parameters, and repeatedly debug numerical instabilities or convergence failures. Furthermore, bridging multiple scales posed additional challenges, as quantum, atomistic, and continuum simulations operate under different physical assumptions, resolution limits, and computational costs, making their integration into a coherent pipeline both time-consuming and error-prone. In recent years, data-driven machine learning models and autonomous agents have begun to augment this paradigm, creating a new ecosystem of powerful computational tools and automated workflows. Representative systems for material simulations are summarized in <xref ref-type="table" rid="t5">Table 5</xref>.</p>
        <table-wrap id="t5">
          <label>Table 5</label>
          <caption>
            <p>Representative systems for simulation and multiscale modeling</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Methods</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Year</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Autonomy level</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Multi-agent</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Closed-loop</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Equipment integration</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Open source</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Agentic system</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>NequIP<sup>[<xref ref-type="bibr" rid="B161">161</xref>]</sup></td>
                <td>2022</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>M3GNet<sup>[<xref ref-type="bibr" rid="B166">166</xref>]</sup></td>
                <td>2022</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MACE<sup>[<xref ref-type="bibr" rid="B164">164</xref>]</sup></td>
                <td>2024</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>DPA-2<sup>[<xref ref-type="bibr" rid="B163">163</xref>]</sup></td>
                <td>2024</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MatterSim<sup>[<xref ref-type="bibr" rid="B165">165</xref>]</sup></td>
                <td>2024</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MDAgent<sup>[<xref ref-type="bibr" rid="B170">170</xref>]</sup></td>
                <td>2025</td>
                <td>L2</td>
                <td>×</td>
                <td>△</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>MDCrow<sup>[<xref ref-type="bibr" rid="B169">169</xref>]</sup></td>
                <td>2025</td>
                <td>L2</td>
                <td>×</td>
                <td>△</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>AtomAgents<sup>[<xref ref-type="bibr" rid="B173">173</xref>]</sup></td>
                <td>2024</td>
                <td>L3</td>
                <td>√</td>
                <td>△</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>El Agente<sup>[<xref ref-type="bibr" rid="B171">171</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>△</td>
                <td>△</td>
                <td>△</td>
                <td>√</td>
              </tr>
              <tr>
                <td>DREAMS<sup>[<xref ref-type="bibr" rid="B159">159</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>△</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>MooseAgent<sup>[<xref ref-type="bibr" rid="B172">172</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>△</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>MatSciAgent<sup>[<xref ref-type="bibr" rid="B174">174</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>△</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Notes: √ = present; × = absent; △ = partial or simulated integration.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>
          <bold>Level 1.</bold> At Level 1 autonomy, agents assist researchers by automating routine preprocessing tasks upon human request. One of the foundations of agentic material simulations is automated material calculation frameworks, including the atomic simulation environment (ASE)<sup>[<xref ref-type="bibr" rid="B157">157</xref>]</sup>, FireWorks<sup>[<xref ref-type="bibr" rid="B88">88</xref>]</sup>, and AiiDA<sup>[<xref ref-type="bibr" rid="B89">89</xref>]</sup>. These frameworks lay the groundwork for workflow definition and automation in material computations, ranging from density functional theory (DFT) and MD to finite element analysis (FEA). LLM-based agents then assist with basic steps such as generating input files<sup>[<xref ref-type="bibr" rid="B158">158</xref>]</sup>, validating structural data, selecting relevant simulation parameters, and retrieving prior results from databases, thus reducing the cognitive load associated with manual model setup<sup>[<xref ref-type="bibr" rid="B159">159</xref>]</sup>. By handling these preparatory and post-processing steps, Level 1 agents relieve researchers of manual drudgery, allowing them to focus on higher-level scientific questions.</p>
        <p>Another foundational direction in applying AI to materials simulations is the use of deep learning models as surrogate solvers to replace computationally expensive physical calculations. Across quantum, atomistic, mesoscale, and continuum regimes, these models learn high-fidelity approximations of energies, forces, or field solutions, enabling orders-of-magnitude acceleration compared with first-principles or conventional numerical solvers. A representative example is the development of machine learning interatomic potentials (MLIPs), which bridge quantum and atomistic simulations by learning energy and force mappings from electronic-structure data. The predictive performance of MLIPs has been significantly improved by explicitly incorporating physical symmetries and constraints<sup>[<xref ref-type="bibr" rid="B160">160</xref>-<xref ref-type="bibr" rid="B162">162</xref>]</sup>. Moving toward more general-purpose large-scale atomistic modeling, universal potentials have been proposed to cover broader chemical and physical domains<sup>[<xref ref-type="bibr" rid="B163">163</xref>-<xref ref-type="bibr" rid="B166">166</xref>]</sup>. Another example is the application of physics-informed neural networks (PINNs) and neural partial differential equation (PDE) models for solving governing equations in mesoscale and continuum simulations<sup>[<xref ref-type="bibr" rid="B167">167</xref>,<xref ref-type="bibr" rid="B168">168</xref>]</sup>.</p>
        <p>While these works substantially improve computational efficiency and scalability, they remain passive components within the simulation pipeline, leaving the choice of simulation boundaries and scales to human researchers. Therefore, these approaches are primarily categorized as Level 1 automation that automates or accelerates specific execution, which lays the foundation for subsequent agentic systems.</p>
        <p>
          <bold>Level 2.</bold> At Level 2, agents transition from passive analysis to active engagement with the scientific toolkit. While humans still define the overarching goals, these agents can independently invoke external tools such as electronic structure codes, MD engines, materials databases, and analysis libraries to execute intermediate tasks. LLMs at this level act as a control layer that interprets high-level scientific intent and dynamically decides which computational tools to invoke, in what sequence, and with which inputs. This “Tool-Augmented” paradigm grounds the reasoning of LLMs in rigorous computational engines, overcoming the hallucination limitations of pure language models.</p>
        <p>For example, MDCrow<sup>[<xref ref-type="bibr" rid="B169">169</xref>]</sup> operates at Level 2 autonomy by enabling an LLM to dynamically select and sequence MD-related tool calls, such as solvation, OpenMM execution, and MDTraj analyses, according to high-level user objectives. These fundamental MD simulation workflows are encapsulated within an agentic toolset designed to autonomously execute MD simulations for exploration of the biochemical design space. The LLM serves as a conversational interface for coordinating, automating, and summarizing simulation steps. Similarly, MDAgent<sup>[<xref ref-type="bibr" rid="B170">170</xref>]</sup> employs a fine-tuned LLM to generate, validate, and execute MD simulation scripts, together with simple feedback loops that enable the agent to iteratively correct syntax errors or adjust simulation settings based on runtime feedback. Despite these advances, decision making at Level 2 remains task-oriented. This limitation motivates the transition to Level 3 autonomy, where agents begin to plan and orchestrate multi-step simulation campaigns with minimal human intervention.</p>
        <p>
          <bold>Level 3.</bold> Level 3 marks the emergence of autonomous orchestration, where MASs plan and execute complex simulation workflows with minimal human intervention. DREAMS<sup>[<xref ref-type="bibr" rid="B159">159</xref>]</sup> exemplifies this paradigm through a hierarchical multi-agent framework that autonomously carries out sequences of DFT calculations. Similarly, El Agente<sup>[<xref ref-type="bibr" rid="B171">171</xref>]</sup> and MooseAgent<sup>[<xref ref-type="bibr" rid="B172">172</xref>]</sup> leverage cooperating LLM agents to translate high-level natural language goals into concrete quantum chemistry or multiphysics simulation tasks while handling execution and error monitoring. AtomAgents<sup>[<xref ref-type="bibr" rid="B173">173</xref>]</sup> introduced a physics-aware, multimodal, multi-agent architecture tailored for alloy design and discovery, in which multiple specialized agents collaboratively orchestrate atomistic simulations, code execution, and multimodal result analysis. By functioning as collaborative <italic>in silico</italic> planners, these systems decompose complex computational goals and coordinate specialized agents to accomplish them, often operating in a closed loop within the simulation environment.</p>
        <p>Conceptually, tool usage under autonomous orchestration can further span across different simulation scales rather than relying solely on individual simulation tools. The development of AI-accelerated cross-scale simulation methods, as mentioned in Level 1, can be integrated into a practical simulation-based pipeline for materials design and engineering. In this context, MatSciAgent<sup>[<xref ref-type="bibr" rid="B174">174</xref>]</sup> represents a distinctive realization of Level 3 autonomy by unifying cross-scale materials simulation tasks within a modular multi-agent orchestration framework. Unlike systems that focus on coordinating a single class of simulation tools, MatSciAgent adopts a master–worker architecture in which a central agent interprets high-level natural-language requests, identifies the underlying task type, and delegates execution to specialized task-specific agents.</p>
        <p>As a result, Level 3 agentic systems for simulation tasks are capable of executing typical multiscale materials simulation workflows in response to high-level user requests by coordinating tool usage and making adaptive decisions. However, despite their advanced planning capabilities, these systems remain confined to the digital realm and lack a direct interface with the physical world.</p>
        <p>
          <bold>Exploration of Level 4 and Level 5.</bold> Although Level 3 systems mainly operate within digital simulation environments, several recent works have begun to explore Level 4 behaviors. As discussed above, systems such as DREAMS<sup>[<xref ref-type="bibr" rid="B159">159</xref>]</sup> and AtomAgents<sup>[<xref ref-type="bibr" rid="B173">173</xref>]</sup> not only plan multi-step simulation workflows, but also begin to handle long-running execution with monitoring and iterative adjustment of workflows based on intermediate results.</p>
        <p>The key step toward Level 4 in simulation and multiscale modeling is therefore not only improved planning, but also closing the loop with the physical world. This requires coupling simulation agents with laboratory automation so that experimental measurements can be used to update model assumptions, parameters, and even the selection of simulation methods, and next rounds of simulations can be scheduled and executed with minimal human intervention. In such a setting, the agent becomes the controller of an experiment-simulation loop rather than merely a simulation planner<sup>[<xref ref-type="bibr" rid="B159">159</xref>,<xref ref-type="bibr" rid="B173">173</xref>]</sup>. Level 5 extends this concept to fully autonomous scientific discovery, in which the agent can connect multiscale modeling with experimental evidence at the level of scientific reasoning<sup>[<xref ref-type="bibr" rid="B175">175</xref>]</sup>. When persistent gaps appear between predictions and observations, a Level 5 agent should be able to propose plausible physical explanations, design integrated simulation-experiment campaigns to test them, and revise its models and hypotheses based on the resulting outcomes. While this capability remains a long-term goal, it represents the ultimate fusion of computation and experimentation for autonomous materials discovery.</p>
      </sec>
      <sec id="sec3-4">
        <title>Automated experimental synthesis</title>
        <p>Experimental synthesis and characterization of new materials is the most critical step in the MSE research pipeline. It is also the most important method to validate previous property prediction and simulation results. The advent of SDLs is redefining how materials are experimentally discovered and tested, moving experimentation from traditional manual work (Level 0) to autonomous closed-loop operation<sup>[<xref ref-type="bibr" rid="B176">176</xref>]</sup>. By integrating robotics, these platforms have the potential to iteratively plan and execute experiments with minimal human input, accelerating discovery and enhancing reproducibility. Recent developments in intelligent AI systems integrated with automated fabrication platforms enable closed-loop optimization of synthesis conditions and materials processing. Representative systems and their capabilities in experimental synthesis are summarized in <xref ref-type="table" rid="t6">Table 6</xref>.</p>
        <table-wrap id="t6">
          <label>Table 6</label>
          <caption>
            <p>Representative systems for automated experimental synthesis</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Methods</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Year</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Autonomy level</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Multi-agent</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Closed-loop</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Equipment integration</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Open source</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Agentic system</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>MatScIE<sup>[<xref ref-type="bibr" rid="B177">177</xref>]</sup></td>
                <td>2021</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MatNexus<sup>[<xref ref-type="bibr" rid="B178">178</xref>]</sup></td>
                <td>2023</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>CRISPR-GPT<sup>[<xref ref-type="bibr" rid="B189">189</xref>]</sup></td>
                <td>2025</td>
                <td>L2</td>
                <td>×</td>
                <td>△</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>SciAgents<sup>[<xref ref-type="bibr" rid="B121">121</xref>]</sup></td>
                <td>2024</td>
                <td>L3</td>
                <td>√</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>ChatGPTResearchGroup<sup>[<xref ref-type="bibr" rid="B181">181</xref>]</sup></td>
                <td>2023</td>
                <td>L3</td>
                <td>√</td>
                <td>√</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
              </tr>
              <tr>
                <td>LABMATE<sup>[<xref ref-type="bibr" rid="B190">190</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>△</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
              </tr>
              <tr>
                <td>MOSAIC<sup>[<xref ref-type="bibr" rid="B191">191</xref>]</sup></td>
                <td>2026</td>
                <td>L3</td>
                <td>√</td>
                <td>△</td>
                <td>△</td>
                <td>√</td>
                <td>△</td>
              </tr>
              <tr>
                <td>AlphaFlow<sup>[<xref ref-type="bibr" rid="B117">117</xref>]</sup></td>
                <td>2023</td>
                <td>L4</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Coscientist<sup>[<xref ref-type="bibr" rid="B17">17</xref>]</sup></td>
                <td>2023</td>
                <td>L4</td>
                <td>√</td>
                <td>√</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>AutoMEX<sup>[<xref ref-type="bibr" rid="B192">192</xref>]</sup></td>
                <td>2025</td>
                <td>L4</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
                <td>×</td>
                <td>√</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Notes: √ = present; × = absent; △ = partial or simulated integration.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>
          <bold>Level 1.</bold> Level 1 autonomy focuses on establishing knowledge-grounded AI systems to assist physical synthesis, enabling human users to interact with the systems and acquire guidance on experimental design and optimization. This stage involves LLM-assisted analysis, where text-mining systems such as MatScIE<sup>[<xref ref-type="bibr" rid="B177">177</xref>]</sup> and MatNexus<sup>[<xref ref-type="bibr" rid="B178">178</xref>]</sup> extract critical data from scientific literature and technical manuals. These systems convert unstructured descriptive text into structured, queryable databases containing materials information and synthesis protocols. Similarly, LLMs have also been integrated into electronic experimental notebooks<sup>[<xref ref-type="bibr" rid="B179">179</xref>]</sup> to facilitate the digitization of routine materials experiments. Some preliminary studies have further utilized the generative capabilities of LLMs to directly predict synthesis pathways for inorganic<sup>[<xref ref-type="bibr" rid="B180">180</xref>]</sup> and organic<sup>[<xref ref-type="bibr" rid="B59">59</xref>]</sup> materials. These efforts reduce the burden on experimentalists by enabling rapid retrieval of protocols, identification of relevant control variables, and generation of hypothesis-driven suggestions for synthesis conditions. They also support the transformation of experience-oriented experimental knowledge into machine-readable and reusable representations, thereby improving efficiency and reproducibility. However, Level 1 systems remain advisory and lack independent planning capabilities or the ability to invoke external tools.</p>
        <p>
          <bold>Level 2.</bold> Building upon knowledge-grounded LLM systems, Level 2 agents function as “digital chemists” by invoking external computational tools for experimental planning. At this level of autonomy, LLM-based agentic systems not only rely on prior knowledge acquired during pretraining and prompt-based reasoning, but also invoke external information sources and computational capabilities to support experimental design for materials fabrication and synthesis optimization. For example, active learning-based methods can function as external tools for optimizing material fabrication parameters<sup>[<xref ref-type="bibr" rid="B181">181</xref>]</sup> or can be combined with Bayesian optimization and LLMs to enhance contextual optimization<sup>[<xref ref-type="bibr" rid="B182">182</xref>-<xref ref-type="bibr" rid="B185">185</xref>]</sup>. For synthesis pathway prediction, advanced LLMs have demonstrated significant competence in predicting reaction outcomes and retrosynthetic routes<sup>[<xref ref-type="bibr" rid="B186">186</xref>]</sup>. External knowledge systems can further enhance synthesis route prediction<sup>[<xref ref-type="bibr" rid="B187">187</xref>]</sup>. This capability is further strengthened by specialized models, such as the conditional graph logic network (GLN) for retrosynthesis<sup>[<xref ref-type="bibr" rid="B116">116</xref>]</sup> and graph-based networks for predicting solid-state synthesis routes<sup>[<xref ref-type="bibr" rid="B188">188</xref>]</sup>. Additionally, data-driven models can emulate human decision making to recommend precursors<sup>[<xref ref-type="bibr" rid="B180">180</xref>]</sup>, while AI co-pilots such as CRISPR-GPT<sup>[<xref ref-type="bibr" rid="B189">189</xref>]</sup> can automate complex experimental designs. Level 2 agents are thus capable of complex computational planning and analysis, yet they remain single-agent systems without multi-step planning capabilities or closed-loop hardware control.</p>
        <p>
          <bold>Level 3.</bold> Level 3 advances to multi-agent coordination, where specialized agents manage <italic>in silico</italic> workflows akin to those of a human research group. These works reflect the decomposition of complex experimental design tasks into subtasks that might involve previous tasks. SciAgents<sup>[<xref ref-type="bibr" rid="B121">121</xref>]</sup> conceptualizes this framework as a “team of AI agents”, in which networks of agents collaborate autonomously through iterative cycles of hypothesis generation and computational validation. ChatGPTResearchGroup<sup>[<xref ref-type="bibr" rid="B181">181</xref>]</sup> organized multiple role-specialized LLM agents to collaboratively conduct closed-loop <italic>in silico</italic> planning and Bayesian optimization for materials synthesis. LABMATE<sup>[<xref ref-type="bibr" rid="B190">190</xref>]</sup> applied this paradigm to catalysis research by orchestrating agents responsible for literature review, simulation, data analysis, and hypothesis generation within a human-in-the-loop computational copilot framework. MOSAIC<sup>[<xref ref-type="bibr" rid="B191">191</xref>]</sup> trained 2,498 specialized chemistry experts and successfully guided the synthesis of over 35 novel compounds across areas such as pharmaceuticals, materials science, and agrochemicals. Although these multi-agent planners can execute complex multi-step computational workflows, they remain disconnected from equipment integration and require human involvement for experimental execution.</p>
        <p>
          <bold>Level 4.</bold> The transition to Level 4 represents the current frontier of research, characterized by exploratory efforts to bridge the gap between digital planning, computation, and the physical execution of experiments. In this phase, pioneering systems act as autonomous planners that directly control robotic laboratories in a closed loop. This emerging capability is exemplified by LLM-driven prototypes such as Coscientist<sup>[<xref ref-type="bibr" rid="B17">17</xref>]</sup> and AutoMEX<sup>[<xref ref-type="bibr" rid="B192">192</xref>]</sup>, which demonstrate the feasibility of using AI to autonomously issue commands to cloud-based lab robots and three-dimensional (3D) printers. Other exploratory platforms leverage algorithmic optimization to guide laboratory hardware, such as the microfluidic systems for nanoparticle synthesis developed by Tao <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B193">193</xref>]</sup> and Sadeghi <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B194">194</xref>]</sup>. More advanced implementations, such as AlphaFlow<sup>[<xref ref-type="bibr" rid="B117">117</xref>]</sup>, utilize RL to control modular reactors and have successfully identified novel synthesis routes that outperform human-designed processes. Perhaps the most comprehensive demonstration of hardware flexibility is the mobile robotic chemist described by Burger <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B195">195</xref>]</sup>, which navigates a standard lab to execute closed-loop optimization. Collectively, these platforms represent early iterations of Level 4 intelligence. Although they are primarily proof-of-concept systems often orchestrated by a central planner, they successfully validate the core criteria for autonomous physical execution.</p>
        <p>
          <bold>Vision for Level 5.</bold> Beyond these emerging implementations lies the aspirational goal of Level 5, which envisions a fully autonomous agent capable of independently formulating broad hypotheses, designing novel research directions, and executing experiments without constraints. However, such a system remains a distant prospect. In the foreseeable future, human experts will remain indispensable. The consensus in the field suggests that the evolution of SDLs will likely stabilize at a human-in-the-loop hybrid model rather than achieve complete human replacement, as argued by Hysmith <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B196">196</xref>]</sup>. Ideally, this synergy between human intuition and transparent, interpretable AI will transform the laboratory into an engine of innovation, enabling scientists to tackle challenges on a previously unimaginable scale.</p>
      </sec>
      <sec id="sec3-5">
        <title>Characterization and data analysis</title>
        <p>Modern MSE relies on advanced characterization techniques that produce vast and complex datasets. These measurements probe material structures and properties across multiple length and time scales from complementary perspectives, posing significant challenges for consistent, knowledge-grounded interpretation. To overcome these challenges, relevant agents have been introduced across workflows ranging from data collection to interpretation, shifting the field from traditional manual interpretation (Level 0) toward autonomous workflows, as summarized in <xref ref-type="table" rid="t7">Table 7</xref>.</p>
        <table-wrap id="t7">
          <label>Table 7</label>
          <caption>
            <p>Representative systems for characterization and data analysis</p>
          </caption>
          <table frame="hsides" rules="groups">
            <thead>
              <tr>
                <td style="border-bottom:1;">
                  <bold>Methods</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Year</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Autonomy level</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Multi-agent</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Closed-loop</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Equipment integration</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Open source</bold>
                </td>
                <td style="border-bottom:1;">
                  <bold>Agentic system</bold>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td>MatQnA<sup>[<xref ref-type="bibr" rid="B197">197</xref>]</sup></td>
                <td>2025</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>MicroscopyGPT<sup>[<xref ref-type="bibr" rid="B204">204</xref>]</sup></td>
                <td>2025</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
              </tr>
              <tr>
                <td>S1-MMAlign<sup>[<xref ref-type="bibr" rid="B198">198</xref>]</sup></td>
                <td>2026</td>
                <td>L1</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Chen <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B205">205</xref>]</sup></td>
                <td>2025</td>
                <td>L2</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>×</td>
                <td>√</td>
              </tr>
              <tr>
                <td>Dara<sup>[<xref ref-type="bibr" rid="B206">206</xref>]</sup></td>
                <td>2025</td>
                <td>L2</td>
                <td>×</td>
                <td>×</td>
                <td>△</td>
                <td>√</td>
                <td>×</td>
              </tr>
              <tr>
                <td>Drug Discovery Agent<sup>[<xref ref-type="bibr" rid="B207">207</xref>]</sup></td>
                <td>2025</td>
                <td>L2</td>
                <td>△</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>MatAgent<sup>[<xref ref-type="bibr" rid="B208">208</xref>]</sup></td>
                <td>2025</td>
                <td>L2</td>
                <td>√</td>
                <td>√</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>AutoMat<sup>[<xref ref-type="bibr" rid="B210">210</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>×</td>
                <td>√</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>IR-Agent<sup>[<xref ref-type="bibr" rid="B211">211</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>Multicrossmodal Agent<sup>[<xref ref-type="bibr" rid="B15">15</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>√</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>SciLink<sup>[<xref ref-type="bibr" rid="B209">209</xref>]</sup></td>
                <td>2025</td>
                <td>L3</td>
                <td>√</td>
                <td>√</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>AdaptiveXRD<sup>[<xref ref-type="bibr" rid="B29">29</xref>]</sup></td>
                <td>2024</td>
                <td>L4</td>
                <td>×</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
                <td>△</td>
              </tr>
              <tr>
                <td>AILA<sup>[<xref ref-type="bibr" rid="B212">212</xref>]</sup></td>
                <td>2025</td>
                <td>L4</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
              </tr>
              <tr>
                <td>ORGANA<sup>[<xref ref-type="bibr" rid="B213">213</xref>]</sup></td>
                <td>2025</td>
                <td>L4</td>
                <td>√</td>
                <td>△</td>
                <td>√</td>
                <td>√</td>
                <td>√</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn>
              <p>Notes: √ = present; × = absent; △ = partial or simulated integration.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>
          <bold>Level 1.</bold> Level 1 systems serve as materials characterization knowledge bases and analytical assistants. For example, MatQnA<sup>[<xref ref-type="bibr" rid="B197">197</xref>]</sup> established a large multimodal benchmark for materials characterization techniques, including XPS, XRD, SEM, and TEM. S1-MMAlign<sup>[<xref ref-type="bibr" rid="B198">198</xref>]</sup> collected large-scale multimodal scientific image interpretation datasets, including materials science data. In addition, several AI systems have been developed for the operation and interpretation of specific characterization techniques such as TEM<sup>[<xref ref-type="bibr" rid="B199">199</xref>]</sup>, XRD<sup>[<xref ref-type="bibr" rid="B200">200</xref>,<xref ref-type="bibr" rid="B201">201</xref>]</sup>, SEM<sup>[<xref ref-type="bibr" rid="B202">202</xref>]</sup>, and spectroscopy<sup>[<xref ref-type="bibr" rid="B203">203</xref>]</sup>, thereby reducing the expertise barrier and subjectivity inherent in manual analysis and laying the groundwork for higher-level autonomy as agentic tools. Notably, MicroscopyGPT<sup>[<xref ref-type="bibr" rid="B204">204</xref>]</sup> is a vision-language model (VLM) that solves the difficult problem of reconstructing full 3D atomic structures from 2D scanning transmission electron microscopy (STEM) images by directly mapping images to structured text. These systems fall within Level 1 as they facilitate AI-assisted IE from multimodal materials characterization data, but function as passive resources without autonomous planning or execution capabilities.</p>
        <p>
          <bold>Level 2.</bold> These data and knowledge resources fuel a new generation of Level 2 (Tool-Augmented) agents, which function as automated analysts for specific tasks. Chen <italic>et al.</italic> proposed an LLM-driven multimodal framework for detecting scale bars and extracting related information from SEM images<sup>[<xref ref-type="bibr" rid="B205">205</xref>]</sup>. The framework uses a You Only Look Once (YOLO)-based detector to localize the scale bar and a hybrid optical character recognition (OCR) system to recognize the numeric value and unit. For diffraction analysis, Dara automates multiple-hypothesis phase identification and refinement from powder XRD data by searching candidate phase combinations and programmatically performing peak matching and Rietveld refinement (accelerated via parallel execution), while using domain-aware criteria to prune candidates and decide when to stop<sup>[<xref ref-type="bibr" rid="B206">206</xref>]</sup>. Drug Discovery Agent<sup>[<xref ref-type="bibr" rid="B207">207</xref>]</sup> can follow high-level prompts to detect and classify drug–cell phenotypes from microscopy images/videos by coordinating vision modules, thereby enabling scalable and near real-time screening. In addition, general-purpose agentic frameworks such as MatAgent<sup>[<xref ref-type="bibr" rid="B208">208</xref>]</sup> show that an LLM-based MAS can run end-to-end experimental data analysis, ranging from exploratory statistics to modeling, visualization, and report generation.</p>
        <p>
          <bold>Level 3.</bold> At Level 3, agents can cope with the complexity and diversity of characterization data by using multi-step planning and agent-based architectures to take an active role in the research process. Systems such as SciLink<sup>[<xref ref-type="bibr" rid="B209">209</xref>]</sup> and AutoMat<sup>[<xref ref-type="bibr" rid="B210">210</xref>]</sup> show how agents can break down complex goals and support end-to-end automated analysis. SciLink<sup>[<xref ref-type="bibr" rid="B209">209</xref>]</sup> can turn raw characterization data into scientific hypotheses, and then assess these claims against published literature. AutoMat<sup>[<xref ref-type="bibr" rid="B210">210</xref>]</sup> uses a “plan-then-execute” design and integrates multiple tools to transform STEM image inputs into reconstructed atomic crystal structures. In spectroscopy, IR-Agent<sup>[<xref ref-type="bibr" rid="B211">211</xref>]</sup> mimics the reasoning process of human experts and employs a team of agents for feature extraction, database retrieval, and final inference of molecular structures. For multimodal data from different sources, Bazgir <italic>et al.</italic> proposed a multi-agent framework with a dynamic gating mechanism<sup>[<xref ref-type="bibr" rid="B15">15</xref>]</sup>. This framework can analyze microscopy images and simulation videos while also retrieving relevant papers and web resources to provide contextual support and improve accuracy. Overall, Level 3 systems enable data-driven inverse reasoning and greatly improve both the efficiency and reliability of extracting scientific insights from raw characterization data.</p>
        <p>
          <bold>Level 4.</bold> At Level 4, agents take on direct operational control of the physical laboratory: they can operate equipment, sustain long-running experiments, and autonomously determine how procedures should proceed during execution. AdaptiveXRD<sup>[<xref ref-type="bibr" rid="B29">29</xref>]</sup> is an autonomous and adaptive XRD system that enables agent-driven, real-time control of physical hardware and can autonomously adjust the scan step size and scan range during measurements. For complex and precise instruments such as atomic force microscopy (AFM), Artificially Intelligent Lab Assistant (AILA)<sup>[<xref ref-type="bibr" rid="B212">212</xref>]</sup> shows strong multi-agent collaboration and supports long-duration autonomous operation. Moreover, ORGANA<sup>[<xref ref-type="bibr" rid="B213">213</xref>]</sup> is a highly integrated automation platform that uses natural language interaction to automate complex chemistry experiments from end to end. It can translate high-level research goals into physical operation commands, marking a shift at Level 4 from single-instrument automation toward more system-level laboratory automation. While these platforms demonstrate promising Level 4 autonomy, they remain early prototypes rather than widely adopted and reliable systems.</p>
        <p>
          <bold>Vision for Level 5.</bold> Level 5 represents a long-term goal: a characterization agent that can work with minimal human input. Beyond operating instruments, such an agent would be able to pose meaningful research questions, choose suitable characterization methods, and integrate evidence from multiple instruments to build a complete view of new materials. This would shift the focus from simply collecting measurements to understanding what the results imply. Reaching this level, however, will require major progress in linking different instruments, standardizing data and metadata, and improving multi-step reasoning. In the near term, Level 5 should be treated as a reference point, while most practical work should focus on strengthening the human–AI collaboration patterns seen in Level 3 and Level 4.</p>
      </sec>
      <sec id="sec3-6">
        <title>Cross-task MSE agents</title>
        <p>The preceding sections examine AI agents within specific, isolated research tasks such as synthesis planning, characterization, property prediction, and simulation. While these task-specific systems have demonstrated significant capabilities, more advanced systems are now emerging that transcend single-task boundaries, integrating diverse capabilities into cohesive research pipelines<sup>[<xref ref-type="bibr" rid="B39">39</xref>,<xref ref-type="bibr" rid="B214">214</xref>]</sup>. These cross-task agents represent a shift from specialized tools to holistic research orchestrators capable of managing the full research cycle, from hypothesis generation to experimental validation.</p>
        <sec id="sec3-6-1">
          <title>Pioneering autonomous laboratories</title>
          <p>Early Level 4 systems demonstrated that robotic platforms could leverage closed-loop machine learning to accelerate discovery. Pioneering examples such as adaptive rapid experimentation and spectroscopy (ARES)<sup>[<xref ref-type="bibr" rid="B215">215</xref>]</sup> (for carbon nanotubes) and Ada<sup>[<xref ref-type="bibr" rid="B136">136</xref>]</sup> (for thin films) showed that algorithms could design, execute, and analyze experiments faster than human researchers. This paradigm was significantly advanced by A-Lab<sup>[<xref ref-type="bibr" rid="B18">18</xref>]</sup>, which integrates computation, literature mining, and robotics to autonomously discover 41 new inorganic materials within 17 days. Similarly, full-process <italic>in silico</italic> frameworks, such as the Level 3 system for perovskite solar cells developed by Ye <italic>et al.</italic><sup>[<xref ref-type="bibr" rid="B216">216</xref>]</sup>, demonstrate how agents can process heterogeneous data spanning materials, fabrication, and performance to uncover complex patterns, even without physical automation. These works highlight the power of integrating diverse data streams and operational modules into a cohesive research engine.</p>
        </sec>
        <sec id="sec3-6-2">
          <title>Unifying computational planning and physical execution</title>
          <p>Recent advances have demonstrated the integration of multi-agent planning with physical experimentation. LLM-RDF<sup>[<xref ref-type="bibr" rid="B217">217</xref>]</sup>, a framework employing specialized agents to coordinate a complete reaction development cycle - from literature search and experiment design to hardware control and spectral analysis - successfully guided the development of a novel oxidation reaction. In the computational domain, TopoMAS<sup>[<xref ref-type="bibr" rid="B218">218</xref>]</sup> orchestrates literature search, hypothesis generation, and DFT simulations in an <italic>in silico</italic> closed loop, identifying novel topological quantum materials. AGAPI-Agents<sup>[<xref ref-type="bibr" rid="B219">219</xref>]</sup> also unifies open-source LLMs with more than 20 materials APIs to autonomously run multi-step, tool-grounded workflows for reproducible and accelerated materials design. Furthermore, ChemAgents<sup>[<xref ref-type="bibr" rid="B220">220</xref>]</sup> seamlessly integrates robotic experimentation, quantum simulations, and ML-driven spectral analysis to investigate azobenzene isomerization, uncovering new mechanistic insights with minimal human intervention. This framework represents a blueprint for autonomous molecular discovery, where agents manage the full “design-make-test-analyze” cycle across both digital and physical realms. To support such cross-domain reasoning, multimodal frameworks such as MatterChat<sup>[<xref ref-type="bibr" rid="B57">57</xref>]</sup> enable agents to process both textual knowledge and structural data, bridging the gap between literature understanding and atomic-level design.</p>
        </sec>
      </sec>
    </sec>
    <sec id="sec4">
      <title>FUTURE WORK</title>
      <sec id="sec4-1">
        <title>Current challenges and inherent limitations</title>
        <p>Our analysis through the six-level framework reveals that the current research gaps in agentic MSE fall into two distinct categories, defined by the nature of the tasks involved.</p>
        <sec id="sec4-1-1">
          <title>Cognition-centric challenges</title>
          <p>These challenges primarily emerge in tasks such as information retrieval, property prediction, and simulation, which operate in the digital domain and rely on the reasoning capabilities of LLMs. Despite rapid progress, current systems are constrained by the intrinsic limitations of LLMs when applied to scientific domains. MSE data are often sparse, heterogeneous, and highly structured, yet LLMs typically process such data as ungrounded text. Consequently, retrieval agents may miss critical context, property predictors may extrapolate beyond physical validity, and simulation planners may generate workflows that are linguistically coherent but numerically unstable. Fundamentally, these systems often lack robust mechanisms for enforcing physical laws, estimating uncertainty, and recovering from failures, hindering their progression to higher levels of autonomous reasoning.</p>
        </sec>
        <sec id="sec4-1-2">
          <title>Execution-centric challenges</title>
          <p>This second category primarily appears in experimental synthesis and materials characterization, where the dominant difficulty shifts from language-based reasoning to physical interaction and real-world control. In materials science research, the execution bottleneck is driven by the heterogeneous and non-standardized nature of laboratory environments, including diverse software–hardware interfaces, inconsistent data formats, and the intrinsic variability of material samples. These factors introduce substantial noise and uncertainty into experimental processes, making reliable execution significantly more challenging than in purely digital settings. Such execution-centric settings also expose reliability problems in instruction adherence. Recent AFM automation studies have shown that LLM agents can take extra actions beyond the given protocol, sometimes acting as if they rely on prior context or memory rather than the current instruction - a behavior referred to as “sleepwalking”<sup>[<xref ref-type="bibr" rid="B212">212</xref>]</sup>. This behavior can appear as risky physical actions beyond authorized limits or as functional code that exceeds the specified requirements, reflecting instruction drift during execution. Such behavior raises clear concerns regarding operational safety and the validity of closed-loop experiments.</p>
          <p>Recent advances in collaborative robotics and automated laboratories have led to the development of middleware frameworks, hardware standardization efforts, and communication protocols (e.g., SiLA<sup>[<xref ref-type="bibr" rid="B221">221</xref>]</sup>, ChemOS<sup>[<xref ref-type="bibr" rid="B25">25</xref>,<xref ref-type="bibr" rid="B222">222</xref>]</sup>, Robot Operating System<sup>[<xref ref-type="bibr" rid="B223">223</xref>]</sup>), which provide an important technical pathway for device coordination and standardization in materials science labs. However, integrating agentic systems into these infrastructures remains non-trivial, as there still exists a gap between agent-level reasoning and device-level communication. Looking forward, an additional challenge lies in enabling effective human–agent collaboration, as future laboratory environments are likely to involve hybrid workflows in which autonomous systems and human operators must co-adapt, share context, and coordinate decisions under uncertainty.</p>
          <p>Uncertainty is another fundamental challenge that permeates all aspects of agentic MSE<sup>[<xref ref-type="bibr" rid="B224">224</xref>]</sup>. At the single-agent level, uncertainty arises from the stochastic nature of LLM outputs, irreducible noise in experimental measurements, and approximation errors in computational simulations<sup>[<xref ref-type="bibr" rid="B225">225</xref>]</sup>. In MASs, these uncertainties do not remain local; instead, they can propagate across agents and even be amplified in a cascading manner. For example, an incorrect assumption introduced during IE may bias downstream property prediction and ultimately lead to suboptimal or even incorrect synthesis decisions<sup>[<xref ref-type="bibr" rid="B226">226</xref>]</sup>. To build trustworthy agentic MSE systems, uncertainty quantification should therefore evolve from a passive monitoring signal into an active control signal. In this context, the agentic uncertainty quantification (AUQ) framework<sup>[<xref ref-type="bibr" rid="B227">227</xref>]</sup> offers a promising direction. Inspired by dual-process theories of human cognition, AUQ converts uncertainty into a closed-loop behavioral signal through uncertainty-aware memory and uncertainty-aware reflection, aiming to mitigate hallucination cascades in long-horizon agent trajectories. More broadly, uncertainty in agentic MSE should not be treated solely as a property of model outputs, but as a system-level quantity that governs whether an agent should continue execution, request additional evidence, trigger self-correction, or defer to human oversight. This issue will become even more important as agentic MSE moves from laboratory prototypes toward industrial deployment, where robustness, reliability, and governance under uncertainty are essential.</p>
          <p>Collectively, these challenges reveal that higher autonomy cannot be achieved by optimizing individual components in isolation. Instead, it requires tightly integrated systems that are knowledge-grounded for cognitive reasoning, perception-aware for physical execution, and equipped with principled mechanisms to quantify, propagate, and act on uncertainty at both the agent and system levels.</p>
        </sec>
      </sec>
      <sec id="sec4-2">
        <title>Strategic directions for future research</title>
        <p>To overcome these hurdles, future research must pivot from purely data-driven approaches toward the development of physically grounded and robustly embodied agents.</p>
        <sec id="sec4-2-1">
          <title>Physically grounded intelligence</title>
          <p>A critical step in addressing cognitive limitations is the development of Hybrid Neuro-Symbolic Reasoning systems<sup>[<xref ref-type="bibr" rid="B228">228</xref>]</sup>. By constraining the generative fluency of LLMs with thermodynamic verifiers and physics-informed logic, agents can ensure their hypotheses are not only novel but also physically viable. This approach entails training agents on “negative data” and physics-informed datasets to instill a form of scientific “common sense”, effectively preventing the proposal of chemically unreasonable candidates.</p>
        </sec>
        <sec id="sec4-2-2">
          <title>Closing the physical execution gap</title>
          <p>To address execution-centric challenges, future systems must move beyond simple API calls to incorporate Active Perception, empowering agents to monitor experiments via computer vision and multimodal sensor feedback. This sensorimotor integration is essential for agents to adaptively correct errors in real time - such as detecting precipitation failures or blocked needles - rather than proceeding blindly. This capability is the foundation for creating truly adaptive and resilient autonomous laboratories.</p>
        </sec>
        <sec id="sec4-2-3">
          <title>Dynamic evaluation and benchmarking</title>
          <p>Establishing robust metrics is essential for quantifying progress across the proposed six-level autonomy hierarchy. Existing benchmarks, such as MatSciBench<sup>[<xref ref-type="bibr" rid="B104">104</xref>]</sup> and MSQA<sup>[<xref ref-type="bibr" rid="B105">105</xref>]</sup>, mainly evaluate static reasoning or isolated property prediction, and therefore provide limited coverage of agentic behavior in long-horizon scientific workflows. However, evaluating an autonomous agent is fundamentally different from evaluating a static LLM: beyond final-answer correctness, it also requires assessing the quality of the reasoning trajectory, including multi-step planning, tool selection, feedback utilization, error recovery, and avoidance of unproductive loops. Recent benchmark efforts have begun to move in this direction. For example, SciAgentGym<sup>[<xref ref-type="bibr" rid="B229">229</xref>]</sup> explicitly evaluates long-horizon scientific tool use and analyzes process-level behaviors such as adaptation to execution errors, parameter tuning, strategic switching, loop escape, and recovery dynamics across interaction steps. Likewise, SGI-Bench<sup>[<xref ref-type="bibr" rid="B230">230</xref>]</sup> frames evaluation around scientist-aligned workflows, covering deep research, idea generation, dry/wet experiments, and experimental reasoning, and further introduces an agent-based evaluation framework to support multi-dimensional assessment.</p>
          <p>Future benchmarking efforts should therefore move beyond outcome-only scoring and incorporate trajectory-level criteria that capture whether an agent can sustain coherent multi-step reasoning, recover from failures, and interact reliably with tools, data, and experimental systems. Such dynamic evaluation testbeds, ideally coupled with realistic noise, hardware constraints, and failure modes, will be essential for assessing agentic resilience in MSE and for charting progress toward fully autonomous AI materials scientists.</p>
        </sec>
        <sec id="sec4-2-4">
          <title>Safety and governance</title>
          <p>Finally, as agents evolve from advisory roles at lower levels to synthesis planning and direct physical execution at higher levels, their dual-use risks become increasingly serious, making safety and governance more critical. The development of autonomous systems requires robust and deterministic safety guardrails, together with specialized safety assessment tools and governance frameworks throughout the agent development lifecycle. To address dual-use risks, a range of advanced red-teaming methods for scientific agents has recently emerged<sup>[<xref ref-type="bibr" rid="B231">231</xref>]</sup>. In addition, the development of standardized safety benchmarks for toxicity screening is a necessary step toward measuring progress<sup>[<xref ref-type="bibr" rid="B232">232</xref>]</sup>. Relevant protocols should verify every chemical instruction against strict safety databases to ensure that the pursuit of autonomous discovery never compromises laboratory safety<sup>[<xref ref-type="bibr" rid="B175">175</xref>]</sup>. In the long term, trustworthy deployment will also require uncertainty-aware governance, in which quantified uncertainty is used not only for post hoc diagnosis, but also for real-time control, escalation, and safety intervention.</p>
        </sec>
        <sec id="sec4-2-5">
          <title>Ecosystem integration and real-world deployment</title>
          <p>Future agentic MSE systems will need to operate within a broader ecosystem that extends beyond the scientific workflow itself. Materials research is closely tied to supply chains for precursors, consumables, instruments, and software, as well as to funding mechanisms, certification procedures, and downstream industrial deployment. These external factors may strongly constrain what an agent can realistically propose or execute. A scientifically valid plan may still fail in practice due to unavailable materials, incompatible equipment, restricted software access, limited project budgets, or unmet regulatory requirements. At the same time, this broader integration opens an important opportunity: agentic MSE could evolve from optimizing isolated scientific tasks to coordinating science with operations. This includes resource-aware planning, procurement-aware experiment scheduling, traceable documentation for certification, and decision support for technology transfer into industrial settings. Accordingly, a major future direction is to develop ecosystem-aware agents that can reason not only over materials knowledge and laboratory feedback, but also over the logistical, economic, and regulatory contexts in which materials innovation actually unfolds. In this sense, higher autonomy can also be defined by the ability to remain actionable under real-world supply, budgetary, and regulatory constraints.</p>
        </sec>
      </sec>
    </sec>
    <sec id="sec5">
      <title>CONCLUSIONS</title>
      <p>This survey reviewed the fast-growing landscape of agentic MSE from a systems view, where agents connect data resources, computational tools, and (in some cases) experimental hardware into unified workflows. To describe this transition in a consistent way, we proposed a six-level autonomy framework and mapped it to five core task families in MSE. This task–level map helps move beyond “model lists” and instead shows what an agent can actually accomplish, what components it must integrate, and where key gaps remain.</p>
      <p>A central finding is that progress is uneven across tasks because each task family faces different limitations in reasoning, tool integration, and safety constraints. This unevenness also reflects a broader workflow shift: traditional MSE work has often been linear and organized into separate steps, with humans manually linking high-level reasoning to low-level execution; agentic workflows aim to close this gap through unified reasoning and planning. Importantly, as autonomy increases, task boundaries become less clear: higher-level agents tend to combine multiple tasks into a unified process.</p>
      <p>A brief cross-task comparison at Level 3 shows why a task–level lens is necessary. Although multi-agent coordination emerges across tasks, the bottlenecks differ: simulation tasks focus on the stable orchestration of long tool chains, information tasks emphasize evidence grounding and scientific validity, and synthesis/characterization tasks are limited mainly by hardware interfaces, sensing capabilities, and experimental variability.</p>
      <p>Looking ahead, the long-term goal is Level 5 autonomy, but the path forward is not only “more capable models”. It requires several system-level advances, including physically grounded intelligence, stronger active perception and embodied interaction, improved evaluation methods for long-horizon autonomy, and clearer safety and governance rules (including equity of access). In this sense, the six-level framework and the task–level map serve as practical guides: they make progress measurable, clarify what “higher autonomy” demands in each task family, and support a systematic transition from isolated tools to reliable human–AI collaboration in real-world MSE workflows.</p>
    </sec>
  </body>
  <back>
    <sec>
      <title>DECLARATIONS</title>
      <sec>
        <title>Acknowledgments</title>
        <p>The authors would like to acknowledge Flaticon (<uri xlink:href="https://www.flaticon.com/">https://www.flaticon.com/</uri>) and IconPark (<uri xlink:href="https://iconpark.oceanengine.com/">https://iconpark.oceanengine.com/</uri>) for providing the icons and graphical assets used in the figures of this manuscript.</p>
      </sec>
      <sec>
        <title>Authors’ contributions</title>
        <p>Conceptualization and design of the review: Luo, Y.; Zhang, T.; Zhu, J.; Zhang, L.</p>
        <p>Writing - manuscript: Zhu, J.; Zhang, L.; Zhu, Y.</p>
        <p>Writing - review and editing: Lin, X.; Wu, Y.; Di, S.; Liu, B.</p>
        <p>Supervision: Luo, Y.; Zhang, T.; Di, S.; Liu, B.</p>
        <p>All authors reviewed and approved the final version of the manuscript.</p>
      </sec>
      <sec>
        <title>Availability of data and materials</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>AI and AI-assisted tools statement</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Financial support and sponsorship</title>
        <p>This work is supported by the National Key R&amp;D Program of China (No. 2025ZD0619400) and by the Guangzhou-HKUST (GZ) Joint Funding Program (No. 2023A03J0003).</p>
      </sec>
      <sec>
        <title>Conflicts of interest</title>
        <p>Zhang, T. is the Editor-in-Chief of <italic>Journal of Materials Informatics</italic>, but was not involved in any stage of the editorial process, notably including reviewer selection, manuscript handling, or decision making. The other authors declare that there are no conflicts of interest.</p>
      </sec>
      <sec>
        <title>Ethical approval and consent to participate</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Consent for publication</title>
        <p>Not applicable.</p>
      </sec>
      <sec>
        <title>Copyright</title>
        <p>© The Author(s) 2026.</p>
      </sec>
    </sec>
    <ref-list>
      <ref id="B1">
        <label>1</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gao</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Tan</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Research on text mining of material science based on natural language processing</article-title>
          <source>IOP Conf Ser Mater Sci Eng</source>
          <year>2020</year>
          <volume>768</volume>
          <fpage>072094</fpage>
          <pub-id pub-id-type="doi">10.1088/1757-899x/768/7/072094</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B2">
        <label>2</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Gupta</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Kilic</surname>
              <given-names>MNT</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Hybrid-LLM-GNN: integrating large language models and graph neural networks for enhanced materials property prediction</article-title>
          <source>Digit Discov</source>
          <year>2025</year>
          <volume>4</volume>
          <fpage>376</fpage>
          <lpage>83</lpage>
          <pub-id pub-id-type="doi">10.1039/d4dd00199k</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B3">
        <label>3</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Olivetti</surname>
              <given-names>EA</given-names>
            </name>
            <name>
              <surname>Cole</surname>
              <given-names>JM</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>E</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Data-driven materials research enabled by natural language processing and information extraction</article-title>
          <source>Appl Phys Rev</source>
          <year>2020</year>
          <volume>7</volume>
          <fpage>041317</fpage>
          <pub-id pub-id-type="doi">10.1063/5.0021106</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B4">
        <label>4</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Reiser</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Neubert</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Eberhard</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Graph neural networks for materials science and chemistry</article-title>
          <source>Commun Mater</source>
          <year>2022</year>
          <volume>3</volume>
          <fpage>93</fpage>
          <pub-id pub-id-type="doi">10.1038/s43246-022-00315-6</pub-id>
          <pub-id pub-id-type="pmid">36468086</pub-id>
          <pub-id pub-id-type="pmcid">PMC9702700</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B5">
        <label>5</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Venugopal</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Sahoo</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Zaki</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Agarwal</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Gosvami</surname>
              <given-names>NN</given-names>
            </name>
            <name>
              <surname>Krishnan</surname>
              <given-names>NMA</given-names>
            </name>
          </person-group>
          <article-title>Looking through glass: knowledge discovery from materials science literature using natural language processing</article-title>
          <source>Patterns</source>
          <year>2021</year>
          <volume>2</volume>
          <fpage>100290</fpage>
          <pub-id pub-id-type="doi">10.1016/j.patter.2021.100290</pub-id>
          <pub-id pub-id-type="pmid">34286304</pub-id>
          <pub-id pub-id-type="pmcid">PMC8276010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B6">
        <label>6</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yoshitake</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Sato</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Kawano</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Teraoka</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>MaterialBERT for natural language processing of materials science texts</article-title>
          <source>Sci Technol Adv Mater Methods</source>
          <year>2022</year>
          <volume>2</volume>
          <fpage>372</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.1080/27660400.2022.2124831</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B7">
        <label>7</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kim</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Kang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Yoo</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Deep-learning-based inverse design model for intelligent discovery of organic molecules</article-title>
          <source>npj Comput Mater</source>
          <year>2018</year>
          <volume>4</volume>
          <fpage>67</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-018-0128-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B8">
        <label>8</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Zhu</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Rodrigues</surname>
              <given-names>SP</given-names>
            </name>
            <name>
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Cai</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Generative model for the inverse design of metasurfaces</article-title>
          <source>Nano Lett</source>
          <year>2018</year>
          <volume>18</volume>
          <fpage>6570</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.nanolett.8b03171</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B9">
        <label>9</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Curtarolo</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Hart</surname>
              <given-names>GLW</given-names>
            </name>
            <name>
              <surname>Nardelli</surname>
              <given-names>MB</given-names>
            </name>
            <name>
              <surname>Mingo</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Sanvito</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Levy</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>The high-throughput highway to computational materials design</article-title>
          <source>Nat Mater</source>
          <year>2013</year>
          <volume>12</volume>
          <fpage>191</fpage>
          <lpage>201</lpage>
          <pub-id pub-id-type="doi">10.1038/nmat3568</pub-id>
          <pub-id pub-id-type="pmid">23422720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B10">
        <label>10</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hachmann</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Olivares-Amaya</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Atahan-Evrenk</surname>
              <given-names>S</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>The Harvard Clean Energy Project: large-scale computational screening and design of organic photovoltaics on the world community grid</article-title>
          <source>J Phys Chem Lett</source>
          <year>2011</year>
          <volume>2</volume>
          <fpage>2241</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.1021/jz200866s</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B11">
        <label>11</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kanal</surname>
              <given-names>IY</given-names>
            </name>
            <name>
              <surname>Owens</surname>
              <given-names>SG</given-names>
            </name>
            <name>
              <surname>Bechtel</surname>
              <given-names>JS</given-names>
            </name>
            <name>
              <surname>Hutchison</surname>
              <given-names>GR</given-names>
            </name>
          </person-group>
          <article-title>Efficient computational screening of organic polymer photovoltaics</article-title>
          <source>J Phys Chem Lett</source>
          <year>2013</year>
          <volume>4</volume>
          <fpage>1613</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1021/jz400215j</pub-id>
          <pub-id pub-id-type="pmid">26282968</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B12">
        <label>12</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ansari</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Moosavi</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Agent-based learning of materials datasets from the scientific literature</article-title>
          <source>Digit Discov</source>
          <year>2024</year>
          <volume>3</volume>
          <fpage>2607</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1039/d4dd00252k</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B13">
        <label>13</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ghafarollahi</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Buehler</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Rapid and automated alloy design with graph neural network-powered large language model-driven multi-agent AI</article-title>
          <source>MRS Bull</source>
          <year>2025</year>
          <volume>50</volume>
          <fpage>1309</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.1557/s43577-025-00953-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B14">
        <label>14</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Hou</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Miret</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <comment>HoneyComb: a flexible LLM-based agent system for materials science. In <italic>Findings of the Association for Computational Linguistics: EMNLP 2024</italic>, 2024 Nov; Miami, USA. Association for Computational Linguistics; 2024. pp. 3369-82.</comment>
          <pub-id pub-id-type="doi">10.18653/v1/2024.findings-emnlp.192</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B15">
        <label>15</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Bazgir</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Madugula</surname>
              <given-names>RCP</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <comment>Multicrossmodal automated agent for integrating diverse materials science data. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2505.15132. <uri xlink:href="https://doi.org/10.48550/arXiv.2505.15132">https://doi.org/10.48550/arXiv.2505.15132</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B16">
        <label>16</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Ling</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Yan</surname>
              <given-names>K</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Toward greater autonomy in materials discovery agents: unifying planning, physics, and scientists. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2506.05616. <uri xlink:href="https://doi.org/10.48550/arXiv.2506.05616">https://doi.org/10.48550/arXiv.2506.05616</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B17">
        <label>17</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Boiko</surname>
              <given-names>DA</given-names>
            </name>
            <name>
              <surname>MacKnight</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Kline</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Gomes</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Autonomous chemical research with large language models</article-title>
          <source>Nature</source>
          <year>2023</year>
          <volume>624</volume>
          <fpage>570</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-023-06792-0</pub-id>
          <pub-id pub-id-type="pmid">38123806</pub-id>
          <pub-id pub-id-type="pmcid">PMC10733136</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B18">
        <label>18</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Szymanski</surname>
              <given-names>NJ</given-names>
            </name>
            <name>
              <surname>Rendy</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Fei</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>An autonomous laboratory for the accelerated synthesis of inorganic materials</article-title>
          <source>Nature</source>
          <year>2023</year>
          <volume>624</volume>
          <fpage>86</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-023-06734-w</pub-id>
          <pub-id pub-id-type="pmid">38030721</pub-id>
          <pub-id pub-id-type="pmcid">PMC10700133</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B19">
        <label>19</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Khan</surname>
              <given-names>SA</given-names>
            </name>
            <name>
              <surname>Mahmud</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Exploring the role of large language models in the scientific method: from hypothesis to discovery</article-title>
          <source>npj Artif Intell</source>
          <year>2025</year>
          <volume>1</volume>
          <fpage>14</fpage>
          <pub-id pub-id-type="doi">10.1038/s44387-025-00019-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B20">
        <label>20</label>
        <nlm-citation publication-type="book">
          <comment>SAE Standard. J3016_202104 - Taxonomy and definitions for terms related to driving automation systems for on-road motor vehicles. 2021.</comment>
          <pub-id pub-id-type="doi">10.4271/J3016_202104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B21">
        <label>21</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Schilling-Wilhelmi</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Ríos-García</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Shabih</surname>
              <given-names>S</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>From text to insight: large language models for chemical data extraction</article-title>
          <source>Chem Soc Rev</source>
          <year>2025</year>
          <volume>54</volume>
          <fpage>1125</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1039/d4cs00913d</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B22">
        <label>22</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ramos</surname>
              <given-names>MC</given-names>
            </name>
            <name>
              <surname>Collison</surname>
              <given-names>CJ</given-names>
            </name>
            <name>
              <surname>White</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <article-title>A review of large language models and autonomous agents in chemistry</article-title>
          <source>Chem Sci</source>
          <year>2025</year>
          <volume>16</volume>
          <fpage>2514</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1039/d4sc03921a</pub-id>
          <pub-id pub-id-type="pmid">39829984</pub-id>
          <pub-id pub-id-type="pmcid">PMC11739813</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B23">
        <label>23</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Schuurmans</surname>
              <given-names>D</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Chain-of-thought prompting elicits reasoning in large language models. <italic>arXiv</italic> <bold>2022</bold>, arXiv:2201.11903. <uri xlink:href="https://doi.org/10.48550/arXiv.2201.11903">https://doi.org/10.48550/arXiv.2201.11903</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B24">
        <label>24</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Dai</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Bo</surname>
              <given-names>X</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A survey on the memory mechanism of large language model-based agents</article-title>
          <source>ACM Trans Inf Syst</source>
          <year>2025</year>
          <volume>43</volume>
          <fpage>1</fpage>
          <lpage>47</lpage>
          <pub-id pub-id-type="doi">10.1145/3748302</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B25">
        <label>25</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sim</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Vakili</surname>
              <given-names>MG</given-names>
            </name>
            <name>
              <surname>Strieth-Kalthoff</surname>
              <given-names>F</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>ChemOS 2.0: an orchestration architecture for chemical self-driving laboratories</article-title>
          <source>Matter</source>
          <year>2024</year>
          <volume>7</volume>
          <fpage>2959</fpage>
          <lpage>77</lpage>
          <pub-id pub-id-type="doi">10.1016/j.matt.2024.04.022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B26">
        <label>26</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Schmidgall</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Su</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Agent laboratory: using LLM agents as research assistants. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2501.04227. <uri xlink:href="https://doi.org/10.48550/arXiv.2501.04227">https://doi.org/10.48550/arXiv.2501.04227</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B27">
        <label>27</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Kapoor</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Stroebl</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Siegel</surname>
              <given-names>ZS</given-names>
            </name>
            <name>
              <surname>Nadgir</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Narayanan</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <comment>AI agents that matter. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2407.01502. <uri xlink:href="https://doi.org/10.48550/arXiv.2407.01502">https://doi.org/10.48550/arXiv.2407.01502</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B28">
        <label>28</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Lu</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Lange</surname>
              <given-names>RT</given-names>
            </name>
            <name>
              <surname>Foerster</surname>
              <given-names>JN</given-names>
            </name>
            <name>
              <surname>Clune</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Ha</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <comment>The AI scientist: towards fully automated open-ended scientific discovery. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2408.06292. <uri xlink:href="https://doi.org/10.48550/arXiv.2408.06292">https://doi.org/10.48550/arXiv.2408.06292</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B29">
        <label>29</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Szymanski</surname>
              <given-names>NJ</given-names>
            </name>
            <name>
              <surname>Bartel</surname>
              <given-names>CJ</given-names>
            </name>
            <name>
              <surname>Zeng</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Diallo</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Ceder</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Adaptively driven X-ray diffraction guided by machine learning for autonomous phase identification</article-title>
          <source>npj Comput Mater</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>31</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-023-00984-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B30">
        <label>30</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Kumbhar</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Mishra</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Coutinho</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Handa</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Iquebal</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Baral</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <comment>Hypothesis generation for materials discovery and design using goal-driven and constraint-guided LLM agents. In <italic>Findings of the Association for Computational Linguistics: NAACL 2025</italic>, 2025 Mar; Albuquerque, New Mexico. Association for Computational Linguistics; 2025. pp. 7524-55.</comment>
          <pub-id pub-id-type="doi">10.18653/v1/2025.findings-naacl.420</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B31">
        <label>31</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Shi</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Knowledge-driven autonomous materials research via collaborative multi-agent and robotic system</article-title>
          <source>Matter</source>
          <year>2026</year>
          <volume>9</volume>
          <fpage>102577</fpage>
          <pub-id pub-id-type="doi">10.1016/j.matt.2025.102577</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B32">
        <label>32</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Pyzer-Knapp</surname>
              <given-names>EO</given-names>
            </name>
            <name>
              <surname>Manica</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Staar</surname>
              <given-names>P</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Foundation models for materials discovery – current state and future directions</article-title>
          <source>npj Comput Mater</source>
          <year>2025</year>
          <volume>11</volume>
          <fpage>61</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-025-01538-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B33">
        <label>33</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Mishra</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Ahlawat</surname>
              <given-names>D</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Foundational large language models for materials research. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2412.09560. <uri xlink:href="https://doi.org/10.48550/arXiv.2412.09560">https://doi.org/10.48550/arXiv.2412.09560</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B34">
        <label>34</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Choi</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Nam</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Choi</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Jung</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A perspective on foundation models in chemistry</article-title>
          <source>JACS Au</source>
          <year>2025</year>
          <volume>5</volume>
          <fpage>1499</fpage>
          <lpage>518</lpage>
          <pub-id pub-id-type="doi">10.1021/jacsau.4c01160</pub-id>
          <pub-id pub-id-type="pmid">40313808</pub-id>
          <pub-id pub-id-type="pmcid">PMC12042027</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B35">
        <label>35</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Van</surname>
              <given-names>MH</given-names>
            </name>
            <name>
              <surname>Verma</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <comment>A survey of AI for materials science: foundation models, LLM agents, datasets, and tools. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2506.20743. <uri xlink:href="https://doi.org/10.48550/arXiv.2506.20743">https://doi.org/10.48550/arXiv.2506.20743</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B36">
        <label>36</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Ran</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Agentic material science</article-title>
          <source>J Mater Inf</source>
          <year>2026</year>
          <volume>6</volume>
          <fpage>10</fpage>
          <pub-id pub-id-type="doi">10.20517/jmi.2025.87</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B37">
        <label>37</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tom</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Schmid</surname>
              <given-names>SP</given-names>
            </name>
            <name>
              <surname>Baird</surname>
              <given-names>SG</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Self-driving laboratories for chemistry and materials science</article-title>
          <source>Chem Rev</source>
          <year>2024</year>
          <volume>124</volume>
          <fpage>9633</fpage>
          <lpage>732</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.chemrev.4c00055</pub-id>
          <pub-id pub-id-type="pmid">39137296</pub-id>
          <pub-id pub-id-type="pmcid">PMC11363023</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B38">
        <label>38</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Anstine</surname>
              <given-names>DM</given-names>
            </name>
            <name>
              <surname>Isayev</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Generative models as an emerging paradigm in the chemical sciences</article-title>
          <source>J Am Chem Soc</source>
          <year>2023</year>
          <volume>145</volume>
          <fpage>8736</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1021/jacs.2c13467</pub-id>
          <pub-id pub-id-type="pmid">37052978</pub-id>
          <pub-id pub-id-type="pmcid">PMC10141264</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B39">
        <label>39</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bran</surname>
              <given-names>AM</given-names>
            </name>
            <name>
              <surname>Cox</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Schilter</surname>
              <given-names>O</given-names>
            </name>
            <name>
              <surname>Baldassari</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>White</surname>
              <given-names>AD</given-names>
            </name>
            <name>
              <surname>Schwaller</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Augmenting large language models with chemistry tools</article-title>
          <source>Nat Mach Intell</source>
          <year>2024</year>
          <volume>6</volume>
          <fpage>525</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1038/s42256-024-00832-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B40">
        <label>40</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gupta</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Zaki</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Krishnan</surname>
              <given-names>NMA</given-names>
            </name>
            <name>
              <surname>Mausam</surname>
            </name>
          </person-group>
          <article-title>MatSciBERT: a materials domain language model for text mining and information extraction</article-title>
          <source>npj Comput Mater</source>
          <year>2022</year>
          <volume>8</volume>
          <fpage>102</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-022-00784-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B41">
        <label>41</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Trewartha</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Walker</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Huo</surname>
              <given-names>H</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Quantifying the advantage of domain-specific pre-training on named entity recognition tasks in materials science</article-title>
          <source>Patterns</source>
          <year>2022</year>
          <volume>3</volume>
          <fpage>100488</fpage>
          <pub-id pub-id-type="doi">10.1016/j.patter.2022.100488</pub-id>
          <pub-id pub-id-type="pmid">35465225</pub-id>
          <pub-id pub-id-type="pmcid">PMC9024010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B42">
        <label>42</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Ott</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Goyal</surname>
              <given-names>N</given-names>
            </name>
            <etal />
          </person-group>
          <comment>RoBERTa: a robustly optimized BERT pretraining approach. <italic>arXiv</italic> <bold>2019</bold>, arXiv:1907.11692. <uri xlink:href="https://doi.org/10.48550/arXiv.1907.11692">https://doi.org/10.48550/arXiv.1907.11692</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B43">
        <label>43</label>
        <nlm-citation publication-type="journal">
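          <person-group person-group-type="author">
            <name>
              <surname>Niyongabo Rubungo</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Arnold</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Rand</surname>
              <given-names>BP</given-names>
            </name>
            <name>
              <surname>Dieng</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>LLM-Prop: predicting the properties of crystalline materials using large language models</article-title>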
          <source>npj Comput Mater</source>
          <year>2025</year>
          <volume>11</volume>
          <fpage>186</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-025-01536-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B44">
        <label>44</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yu</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Baker</surname>
              <given-names>FN</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Ning</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <comment>LlaSMol: advancing large language models for chemistry with a large-scale, comprehensive, high-quality instruction tuning dataset. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2402.09391. <uri xlink:href="https://doi.org/10.48550/arXiv.2402.09391">https://doi.org/10.48550/arXiv.2402.09391</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B45">
        <label>45</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Qiu</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Jing</surname>
              <given-names>E</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Introducing PolySea: an LLM-based polymer smart evolution agent</article-title>
          <source>ChemRxiv</source>
          <year>2025</year>
          <pub-id pub-id-type="doi">10.26434/chemrxiv-2025-zw65g</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B46">
        <label>46</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tian</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Steel design based on a large language model</article-title>
          <source>Acta Mater</source>
          <year>2025</year>
          <volume>285</volume>
          <fpage>120663</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2024.120663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B47">
        <label>47</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Lv</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Shu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Xiao</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Incorporating molecular knowledge in large language models via multimodal modeling</article-title>
          <source>IEEE Trans Comput Soc Syst</source>
          <year>2025</year>
          <volume>12</volume>
          <fpage>3660</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1109/tcss.2024.3506158</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B48">
        <label>48</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zholus</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Kuznetsov</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Schutski</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <comment>BindGPT: a scalable framework for 3D molecular design via language modeling and reinforcement learning. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2406.03686. <uri xlink:href="https://doi.org/10.48550/arXiv.2406.03686">https://doi.org/10.48550/arXiv.2406.03686</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B49">
        <label>49</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Tan</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Xia</surname>
              <given-names>P</given-names>
            </name>
            <etal />
          </person-group>
          <comment>ChemMLLM: chemical multimodal large language model. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2505.16326. <uri xlink:href="https://doi.org/10.48550/arXiv.2505.16326">https://doi.org/10.48550/arXiv.2505.16326</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B50">
        <label>50</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kuenneth</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Ramprasad</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>polyBERT: a chemical language model to enable fully machine-driven ultrafast polymer informatics</article-title>
          <source>Nat Commun</source>
          <year>2023</year>
          <volume>14</volume>
          <fpage>4099</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-023-39868-6</pub-id>
          <pub-id pub-id-type="pmid">37433807</pub-id>
          <pub-id pub-id-type="pmcid">PMC10336012</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B51">
        <label>51</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Barati Farimani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>TransPolymer: a Transformer-based language model for polymer property predictions</article-title>
          <source>npj Comput Mater</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>64</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-023-01016-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B52">
        <label>52</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Chaudhari</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Guntuboina</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Farimani</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>AlloyBERT: alloy property prediction with large language models</article-title>
          <source>Comput Mater Sci</source>
          <year>2024</year>
          <volume>244</volume>
          <fpage>113256</fpage>
          <pub-id pub-id-type="doi">10.1016/j.commatsci.2024.113256</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B53">
        <label>53</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Perovskite-LLM: knowledge-enhanced large language models for perovskite solar cell research. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2502.12669. <uri xlink:href="https://doi.org/10.48550/arXiv.2502.12669">https://doi.org/10.48550/arXiv.2502.12669</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B54">
        <label>54</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Cole</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>BatteryBERT: a pretrained language model for battery database enhancement</article-title>
          <source>J Chem Inf Model</source>
          <year>2022</year>
          <volume>62</volume>
          <fpage>6365</fpage>
          <lpage>77</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jcim.2c00035</pub-id>
          <pub-id pub-id-type="pmid">35533012</pub-id>
          <pub-id pub-id-type="pmcid">PMC9795558</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B55">
        <label>55</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Cole</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>OpticalBERT and OpticalTable-SQA: text- and table-based language models for the optical-materials domain</article-title>
          <source>J Chem Inf Model</source>
          <year>2023</year>
          <volume>63</volume>
          <fpage>1961</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jcim.2c01259</pub-id>
          <pub-id pub-id-type="pmid">36940385</pub-id>
          <pub-id pub-id-type="pmcid">PMC10091421</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B56">
        <label>56</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Mok</surname>
              <given-names>DH</given-names>
            </name>
            <name>
              <surname>Back</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Generative pretrained transformer for heterogeneous catalysts</article-title>
          <source>J Am Chem Soc</source>
          <year>2024</year>
          <volume>146</volume>
          <fpage>33712</fpage>
          <lpage>22</lpage>
          <pub-id pub-id-type="doi">10.1021/jacs.4c11504</pub-id>
          <pub-id pub-id-type="pmid">39576215</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B57">
        <label>57</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Cao</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <comment>MatterChat: a multi-modal LLM for material science. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2502.13107. <uri xlink:href="https://doi.org/10.48550/arXiv.2502.13107">https://doi.org/10.48550/arXiv.2502.13107</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B58">
        <label>58</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Antunes</surname>
              <given-names>LM</given-names>
            </name>
            <name>
              <surname>Butler</surname>
              <given-names>KT</given-names>
            </name>
            <name>
              <surname>Grau-Crespo</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Crystal structure generation with autoregressive large language modeling</article-title>
          <source>Nat Commun</source>
          <year>2024</year>
          <volume>15</volume>
          <fpage>10570</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-024-54639-7</pub-id>
          <pub-id pub-id-type="pmid">39643601</pub-id>
          <pub-id pub-id-type="pmcid">PMC11624194</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B59">
        <label>59</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Shi</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>BatGPT-Chem: a foundation large model for chemical engineering</article-title>
          <source>Research</source>
          <year>2025</year>
          <volume>8</volume>
          <fpage>0827</fpage>
          <pub-id pub-id-type="doi">10.34133/research.0827</pub-id>
          <pub-id pub-id-type="pmid">40936797</pub-id>
          <pub-id pub-id-type="pmcid">PMC12421729</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B60">
        <label>60</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jain</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Ong</surname>
              <given-names>SP</given-names>
            </name>
            <name>
              <surname>Hautier</surname>
              <given-names>G</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Commentary: The Materials Project: a materials genome approach to accelerating materials innovation</article-title>
          <source>APL Mater</source>
          <year>2013</year>
          <volume>1</volume>
          <fpage>011002</fpage>
          <pub-id pub-id-type="doi">10.1063/1.4812323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B61">
        <label>61</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Talirz</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Kumbhar</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Passaro</surname>
              <given-names>E</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Materials Cloud, a platform for open computational science</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <volume>7</volume>
          <fpage>299</fpage>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00637-5</pub-id>
          <pub-id pub-id-type="pmid">32901046</pub-id>
          <pub-id pub-id-type="pmcid">PMC7479138</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B62">
        <label>62</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Scheidgen</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Himanen</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Ladines</surname>
              <given-names>AN</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>NOMAD: a distributed web-based platform for managing materials science research data</article-title>
          <source>J Open Source Softw</source>
          <year>2023</year>
          <volume>8</volume>
          <fpage>5388</fpage>
          <pub-id pub-id-type="doi">10.21105/joss.05388</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B63">
        <label>63</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Esters</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Oses</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Divilov</surname>
              <given-names>S</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>aflow.org: a web ecosystem of databases, software and tools</article-title>
          <source>Comput Mater Sci</source>
          <year>2023</year>
          <volume>216</volume>
          <fpage>111808</fpage>
          <pub-id pub-id-type="doi">10.1016/j.commatsci.2022.111808</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B64">
        <label>64</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Venugopal</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Olivetti</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>MatKG: an autonomously generated knowledge graph in Material Science</article-title>
          <source>Sci Data</source>
          <year>2024</year>
          <volume>11</volume>
          <fpage>217</fpage>
          <pub-id pub-id-type="doi">10.1038/s41597-024-03039-z</pub-id>
          <pub-id pub-id-type="pmid">38368452</pub-id>
          <pub-id pub-id-type="pmcid">PMC10874416</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B65">
        <label>65</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A materials terminology knowledge graph automatically constructed from text corpus</article-title>
          <source>Sci Data</source>
          <year>2024</year>
          <volume>11</volume>
          <fpage>600</fpage>
          <pub-id pub-id-type="doi">10.1038/s41597-024-03448-0</pub-id>
          <pub-id pub-id-type="pmid">38849436</pub-id>
          <pub-id pub-id-type="pmcid">PMC11161478</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B66">
        <label>66</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Statt</surname>
              <given-names>MJ</given-names>
            </name>
            <name>
              <surname>Rohr</surname>
              <given-names>BA</given-names>
            </name>
            <name>
              <surname>Guevarra</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Breeden</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Suram</surname>
              <given-names>SK</given-names>
            </name>
            <name>
              <surname>Gregoire</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>The materials experiment knowledge graph</article-title>
          <source>Digit Discov</source>
          <year>2023</year>
          <volume>2</volume>
          <fpage>909</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1039/d3dd00067b</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B67">
        <label>67</label>
        <nlm-citation publication-type="web">
          <comment>MongoDB Inc. MongoDB: the world’s leading modern data platform. <uri xlink:href="https://www.mongodb.com/">https://www.mongodb.com/</uri>. (accessed 2026-05-18)</comment>
        </nlm-citation>
      </ref>
      <ref id="B68">
        <label>68</label>
        <nlm-citation publication-type="web">
          <comment>PostgreSQL: the world’s most advanced open source relational database. <uri xlink:href="https://www.postgresql.org/">https://www.postgresql.org/</uri>. (accessed 2026-05-18)</comment>
        </nlm-citation>
      </ref>
      <ref id="B69">
        <label>69</label>
        <nlm-citation publication-type="web">
          <comment>Elementary Multiperspective Material Ontology (EMMO). 2025. <uri xlink:href="https://github.com/emmo-repo/EMMO">https://github.com/emmo-repo/EMMO</uri>. (accessed 2026-05-18)</comment>
        </nlm-citation>
      </ref>
      <ref id="B70">
        <label>70</label>
        <nlm-citation publication-type="book">
          <comment>de Sainte Marie, C.; Iglesias Escudero, M.; Rosina, P. The ONTORULE Project: where ontology meets business rules. In <italic>Web Reasoning and Rule Systems</italic>. RR 2011. Lecture Notes in Computer Science, vol 6902; Springer, Berlin, Heidelberg: 2011. pp. 24-9.</comment>
          <pub-id pub-id-type="doi">10.1007/978-3-642-23580-1_3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B71">
        <label>71</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Premkumar</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Krishnamurty</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Wileden</surname>
              <given-names>JC</given-names>
            </name>
            <name>
              <surname>Grosse</surname>
              <given-names>IR</given-names>
            </name>
          </person-group>
          <article-title>A semantic knowledge management system for laminated composites</article-title>
          <source>Adv Eng Inform</source>
          <year>2014</year>
          <volume>28</volume>
          <fpage>91</fpage>
          <lpage>101</lpage>
          <pub-id pub-id-type="doi">10.1016/j.aei.2013.12.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B72">
        <label>72</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Douze</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Guzhva</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Deng</surname>
              <given-names>C</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>The Faiss library</article-title>
          <source>IEEE Trans Big Data</source>
          <year>2026</year>
          <volume>12</volume>
          <fpage>346</fpage>
          <lpage>61</lpage>
          <pub-id pub-id-type="doi">10.1109/tbdata.2025.3618474</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B73">
        <label>73</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yi</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Guo</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Milvus: a purpose-built vector data management system. In <italic>Proceedings of the 2021 International Conference on Management of Data</italic>. Association for Computing Machinery; 2021. pp. 2614-27.</comment>
          <pub-id pub-id-type="doi">10.1145/3448016.3457550</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B74">
        <label>74</label>
        <nlm-citation publication-type="web">
          <comment>Qdrant. 2025. <uri xlink:href="https://github.com/qdrant/qdrant">https://github.com/qdrant/qdrant</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B75">
        <label>75</label>
        <nlm-citation publication-type="web">
          <comment>Weaviate. 2025. <uri xlink:href="https://github.com/weaviate/weaviate">https://github.com/weaviate/weaviate</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B76">
        <label>76</label>
        <nlm-citation publication-type="web">
          <comment>Neo4j. Graph Intelligence Platform. 2026. <uri xlink:href="https://neo4j.com/">https://neo4j.com/</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B77">
        <label>77</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Krech</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Grimnes</surname>
              <given-names>GA</given-names>
            </name>
            <name>
              <surname>Higgins</surname>
              <given-names>G</given-names>
            </name>
            <etal />
          </person-group>
          <comment>RDFLib. 2023.</comment>
          <pub-id pub-id-type="doi">10.5281/zenodo.8206632</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B78">
        <label>78</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Packer</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Wooders</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Lin</surname>
              <given-names>K</given-names>
            </name>
            <etal />
          </person-group>
          <comment>MemGPT: towards LLMs as operating systems. <italic>arXiv</italic> <bold>2023</bold>, arXiv:2310.08560. <uri xlink:href="https://doi.org/10.48550/arXiv.2310.08560">https://doi.org/10.48550/arXiv.2310.08560</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B79">
        <label>79</label>
        <nlm-citation publication-type="web">
          <comment>LlamaIndex. 2026. <uri xlink:href="https://www.llamaindex.ai/">https://www.llamaindex.ai/</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B80">
        <label>80</label>
        <nlm-citation publication-type="web">
          <comment>Haystack. 2019. <uri xlink:href="https://github.com/deepset-ai/haystack">https://github.com/deepset-ai/haystack</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B81">
        <label>81</label>
        <nlm-citation publication-type="web">
          <comment>SerpApi: Google Search API. <uri xlink:href="https://serpapi.com/">https://serpapi.com/</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B82">
        <label>82</label>
        <nlm-citation publication-type="web">
          <comment>LangChain. 2022. <uri xlink:href="https://github.com/langchain-ai/langchain">https://github.com/langchain-ai/langchain</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B83">
        <label>83</label>
        <nlm-citation publication-type="web">
          <comment>LangGraph. 2025. <uri xlink:href="https://github.com/langchain-ai/langgraph">https://github.com/langchain-ai/langgraph</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B84">
        <label>84</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wu</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Bansal</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <comment>AutoGen: enabling next-gen LLM applications via multi-agent conversation. <italic>arXiv</italic> <bold>2023</bold>, arXiv:2308.08155. <uri xlink:href="https://doi.org/10.48550/arXiv.2308.08155">https://doi.org/10.48550/arXiv.2308.08155</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B85">
        <label>85</label>
        <nlm-citation publication-type="web">
          <comment>crewAI. 2025. <uri xlink:href="https://github.com/crewAIInc/crewAI">https://github.com/crewAIInc/crewAI</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B86">
        <label>86</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yao</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>D</given-names>
            </name>
            <etal />
          </person-group>
          <comment>ReAct: synergizing reasoning and acting in language models. <italic>arXiv</italic> <bold>2022</bold>, arXiv:2210.03629. <uri xlink:href="https://doi.org/10.48550/arXiv.2210.03629">https://doi.org/10.48550/arXiv.2210.03629</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B87">
        <label>87</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Shinn</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Cassano</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Berman</surname>
              <given-names>E</given-names>
            </name>
            <name>
              <surname>Gopinath</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Narasimhan</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Yao</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <comment>Reflexion: language agents with verbal reinforcement learning. <italic>arXiv</italic> <bold>2023</bold>, arXiv:2303.11366. <uri xlink:href="https://doi.org/10.48550/arXiv.2303.11366">https://doi.org/10.48550/arXiv.2303.11366</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B88">
        <label>88</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jain</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Ong</surname>
              <given-names>SP</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>FireWorks: a dynamic workflow system designed for high‐throughput applications</article-title>
          <source>Concurr Comput Pract Exp</source>
          <year>2015</year>
          <volume>27</volume>
          <fpage>5037</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1002/cpe.3505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B89">
        <label>89</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Huber</surname>
              <given-names>SP</given-names>
            </name>
            <name>
              <surname>Zoupanos</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Uhrin</surname>
              <given-names>M</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>AiiDA 1.0, a scalable computational infrastructure for automated reproducible workflows and data provenance</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <volume>7</volume>
          <fpage>300</fpage>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00638-4</pub-id>
          <pub-id pub-id-type="pmid">32901044</pub-id>
          <pub-id pub-id-type="pmcid">PMC7479590</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B90">
        <label>90</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sundberg</surname>
              <given-names>JD</given-names>
            </name>
            <name>
              <surname>Benjamin</surname>
              <given-names>SS</given-names>
            </name>
            <name>
              <surname>McRae</surname>
              <given-names>LM</given-names>
            </name>
            <name>
              <surname>Warren</surname>
              <given-names>SC</given-names>
            </name>
          </person-group>
          <article-title>Simmate: a framework for materials science</article-title>
          <source>J Open Source Softw</source>
          <year>2022</year>
          <volume>7</volume>
          <fpage>4364</fpage>
          <pub-id pub-id-type="doi">10.21105/joss.04364</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B91">
        <label>91</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ward</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Pauloski</surname>
              <given-names>JG</given-names>
            </name>
            <name>
              <surname>Hayot-Sasson</surname>
              <given-names>V</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Employing artificial intelligence to steer exascale workflows with Colmena</article-title>
          <source>Int J High Perform Comput Appl</source>
          <year>2024</year>
          <volume>39</volume>
          <fpage>52</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.1177/10943420241288242</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B92">
        <label>92</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ong</surname>
              <given-names>SP</given-names>
            </name>
            <name>
              <surname>Richards</surname>
              <given-names>WD</given-names>
            </name>
            <name>
              <surname>Jain</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Python Materials Genomics (pymatgen): a robust, open-source Python library for materials analysis</article-title>
          <source>Comput Mater Sci</source>
          <year>2013</year>
          <volume>68</volume>
          <fpage>314</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.commatsci.2012.10.028</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B93">
        <label>93</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Hafner</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Kresse</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <comment>The Vienna AB-Initio Simulation Program VASP: an efficient and versatile tool for studying the structural, dynamic, and electronic properties of materials. In: Gonis, A.; Meike, A.; Turchi, P. E. A.; Editors. <italic>Properties of Complex Inorganic Solids</italic>. Springer US; 1997. pp. 69-82.</comment>
          <pub-id pub-id-type="doi">10.1007/978-1-4615-5943-6_10</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B94">
        <label>94</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Giannozzi</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Baroni</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Bonini</surname>
              <given-names>N</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>QUANTUM ESPRESSO: a modular and open-source software project for quantum simulations of materials</article-title>
          <source>J Phys Condens Matter</source>
          <year>2009</year>
          <volume>21</volume>
          <fpage>395502</fpage>
          <pub-id pub-id-type="doi">10.1088/0953-8984/21/39/395502</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B95">
        <label>95</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gonze</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Amadon</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Anglade</surname>
              <given-names>P</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>ABINIT: first-principles approach to material and nanosystem properties</article-title>
          <source>Comput Phys Commun</source>
          <year>2009</year>
          <volume>180</volume>
          <fpage>2582</fpage>
          <lpage>615</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cpc.2009.07.007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B96">
        <label>96</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Mortensen</surname>
              <given-names>JJ</given-names>
            </name>
            <name>
              <surname>Larsen</surname>
              <given-names>AH</given-names>
            </name>
            <name>
              <surname>Kuisma</surname>
              <given-names>M</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>GPAW: an open Python package for electronic structure calculations</article-title>
          <source>J Chem Phys</source>
          <year>2024</year>
          <volume>160</volume>
          <fpage>092503</fpage>
          <pub-id pub-id-type="doi">10.1063/5.0182685</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B97">
        <label>97</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Thompson</surname>
              <given-names>AP</given-names>
            </name>
            <name>
              <surname>Aktulga</surname>
              <given-names>HM</given-names>
            </name>
            <name>
              <surname>Berger</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>LAMMPS - a flexible simulation tool for particle-based materials modeling at the atomic, meso, and continuum scales</article-title>
          <source>Comput Phys Commun</source>
          <year>2022</year>
          <volume>271</volume>
          <fpage>108171</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cpc.2021.108171</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B98">
        <label>98</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Abraham</surname>
              <given-names>MJ</given-names>
            </name>
            <name>
              <surname>Murtola</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Schulz</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>GROMACS: high performance molecular simulations through multi-level parallelism from laptops to supercomputers</article-title>
          <source>SoftwareX</source>
          <year>2015</year>
          <volume>1-2</volume>
          <fpage>19</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.1016/j.softx.2015.06.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B99">
        <label>99</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Eastman</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Galvelis</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Peláez</surname>
              <given-names>RP</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>OpenMM 8: molecular dynamics simulation with machine learning potentials</article-title>
          <source>J Phys Chem B</source>
          <year>2024</year>
          <volume>128</volume>
          <fpage>109</fpage>
          <lpage>16</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jpcb.3c06662</pub-id>
          <pub-id pub-id-type="pmid">38154096</pub-id>
          <pub-id pub-id-type="pmcid">PMC10846090</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B100">
        <label>100</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Grecco</surname>
              <given-names>HE</given-names>
            </name>
            <name>
              <surname>Dartiailh</surname>
              <given-names>MC</given-names>
            </name>
            <name>
              <surname>Thalhammer-Thurner</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Bronger</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Bauer</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>PyVISA: the Python instrumentation package</article-title>
          <source>J Open Source Softw</source>
          <year>2023</year>
          <volume>8</volume>
          <fpage>5304</fpage>
          <pub-id pub-id-type="doi">10.21105/joss.05304</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B101">
        <label>101</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Pyzer-Knapp</surname>
              <given-names>EO</given-names>
            </name>
            <name>
              <surname>Pitera</surname>
              <given-names>JW</given-names>
            </name>
            <name>
              <surname>Staar</surname>
              <given-names>PWJ</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Accelerating materials discovery using artificial intelligence, high performance computing and robotics</article-title>
          <source>npj Comput Mater</source>
          <year>2022</year>
          <volume>8</volume>
          <fpage>84</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-022-00765-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B102">
        <label>102</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wierenga</surname>
              <given-names>RP</given-names>
            </name>
            <name>
              <surname>Golas</surname>
              <given-names>SM</given-names>
            </name>
            <name>
              <surname>Ho</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Coley</surname>
              <given-names>CW</given-names>
            </name>
            <name>
              <surname>Esvelt</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <article-title>PyLabRobot: an open-source, hardware agnostic interface for liquid-handling robots and accessories</article-title>
          <source>Device</source>
          <year>2023</year>
          <volume>1</volume>
          <fpage>100111</fpage>
          <pub-id pub-id-type="doi">10.1016/j.device.2023.100111</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B103">
        <label>103</label>
        <nlm-citation publication-type="web">
          <comment>Pydantic AI. 2025. <uri xlink:href="https://github.com/pydantic/pydantic-ai">https://github.com/pydantic/pydantic-ai</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B104">
        <label>104</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Gan</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <etal />
          </person-group>
          <comment>MatSciBench: benchmarking the reasoning ability of large language models in materials science. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2510.12171. <uri xlink:href="https://doi.org/10.48550/arXiv.2510.12171">https://doi.org/10.48550/arXiv.2510.12171</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B105">
        <label>105</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Cheung</surname>
              <given-names>JJ</given-names>
            </name>
            <name>
              <surname>Shen</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Zhuang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Ramprasad</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <comment>MSQA: benchmarking LLMs on graduate-level materials science reasoning and knowledge. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2505.23982. <uri xlink:href="https://doi.org/10.48550/arXiv.2505.23982">https://doi.org/10.48550/arXiv.2505.23982</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B106">
        <label>106</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Ye</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Srolovitz</surname>
              <given-names>DJ</given-names>
            </name>
            <name>
              <surname>Wen</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <comment>MatTools: benchmarking large language models for materials science tools. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2505.10852. <uri xlink:href="https://doi.org/10.48550/arXiv.2505.10852">https://doi.org/10.48550/arXiv.2505.10852</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B107">
        <label>107</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yanguas-Gil</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Dearing</surname>
              <given-names>MT</given-names>
            </name>
            <name>
              <surname>Elam</surname>
              <given-names>JW</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Benchmarking large language models for materials synthesis: the case of atomic layer deposition. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2412.10477. <uri xlink:href="https://doi.org/10.48550/arXiv.2412.10477">https://doi.org/10.48550/arXiv.2412.10477</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B108">
        <label>108</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Riebesell</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Goodall</surname>
              <given-names>REA</given-names>
            </name>
            <name>
              <surname>Benner</surname>
              <given-names>P</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A framework to evaluate machine learning crystal stability predictions</article-title>
          <source>Nat Mach Intell</source>
          <year>2025</year>
          <volume>7</volume>
          <fpage>836</fpage>
          <lpage>47</lpage>
          <pub-id pub-id-type="doi">10.1038/s42256-025-01055-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B109">
        <label>109</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Fang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <comment>RxnBench: a multimodal benchmark for evaluating large language models on chemical reaction understanding from scientific literature. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2512.23565. <uri xlink:href="https://doi.org/10.48550/arXiv.2512.23565">https://doi.org/10.48550/arXiv.2512.23565</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B110">
        <label>110</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Song</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Du</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Evaluating large language models in scientific discovery. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2512.15567. <uri xlink:href="https://doi.org/10.48550/arXiv.2512.15567">https://doi.org/10.48550/arXiv.2512.15567</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B111">
        <label>111</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Scientists’ first exam: probing cognitive abilities of MLLM via perception, understanding, and reasoning. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2506.10521. <uri xlink:href="https://doi.org/10.48550/arXiv.2506.10521">https://doi.org/10.48550/arXiv.2506.10521</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B112">
        <label>112</label>
        <nlm-citation publication-type="web">
          <comment>LangSmith docs. <uri xlink:href="https://docs.langchain.com/langsmith/home">https://docs.langchain.com/langsmith/home</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B113">
        <label>113</label>
        <nlm-citation publication-type="web">
          <comment>Evals. <uri xlink:href="https://github.com/openai/evals">https://github.com/openai/evals</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B114">
        <label>114</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Es</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>James</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Espinosa-Anke</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Schockaert</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <comment>Ragas: automated evaluation of retrieval augmented generation. <italic>arXiv</italic> <bold>2023</bold>, arXiv:2309.15217. <uri xlink:href="https://doi.org/10.48550/arXiv.2309.15217">https://doi.org/10.48550/arXiv.2309.15217</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B115">
        <label>115</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kononova</surname>
              <given-names>O</given-names>
            </name>
            <name>
              <surname>He</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Huo</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Trewartha</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Olivetti</surname>
              <given-names>EA</given-names>
            </name>
            <name>
              <surname>Ceder</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Opportunities and challenges of text mining in materials research</article-title>
          <source>iScience</source>
          <year>2021</year>
          <volume>24</volume>
          <fpage>102155</fpage>
          <pub-id pub-id-type="doi">10.1016/j.isci.2021.102155</pub-id>
          <pub-id pub-id-type="pmid">33665573</pub-id>
          <pub-id pub-id-type="pmcid">PMC7905448</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B116">
        <label>116</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Dai</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Coley</surname>
              <given-names>CW</given-names>
            </name>
            <name>
              <surname>Dai</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Song</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <comment>Retrosynthesis prediction with conditional graph logic network. <italic>arXiv</italic> <bold>2020</bold>, arXiv:2001.01408. <uri xlink:href="https://doi.org/10.48550/arXiv.2001.01408">https://doi.org/10.48550/arXiv.2001.01408</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B117">
        <label>117</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Volk</surname>
              <given-names>AA</given-names>
            </name>
            <name>
              <surname>Epps</surname>
              <given-names>RW</given-names>
            </name>
            <name>
              <surname>Yonemoto</surname>
              <given-names>DT</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>AlphaFlow: autonomous discovery and optimization of multi-step chemistry using a self-driven fluidic lab guided by reinforcement learning</article-title>
          <source>Nat Commun</source>
          <year>2023</year>
          <volume>14</volume>
          <fpage>1403</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-023-37139-y</pub-id>
          <pub-id pub-id-type="pmid">36918561</pub-id>
          <pub-id pub-id-type="pmcid">PMC10015005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B118">
        <label>118</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Cole</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>A database of battery materials auto-generated using ChemDataExtractor</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <volume>7</volume>
          <fpage>260</fpage>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00602-2</pub-id>
          <pub-id pub-id-type="pmid">32764659</pub-id>
          <pub-id pub-id-type="pmcid">PMC7411033</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B119">
        <label>119</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yan</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Dang</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Su</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Materials information extraction via automatically generated corpus</article-title>
          <source>Sci Data</source>
          <year>2022</year>
          <volume>9</volume>
          <fpage>401</fpage>
          <pub-id pub-id-type="doi">10.1038/s41597-022-01492-2</pub-id>
          <pub-id pub-id-type="pmid">35831367</pub-id>
          <pub-id pub-id-type="pmcid">PMC9279422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B120">
        <label>120</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Polak</surname>
              <given-names>MP</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>SY</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Beyond designer’s knowledge: generating materials design hypotheses via large language models</article-title>
          <source>Acta Mater</source>
          <year>2025</year>
          <volume>297</volume>
          <fpage>121307</fpage>
          <pub-id pub-id-type="doi">10.1016/j.actamat.2025.121307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B121">
        <label>121</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Ghafarollahi</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Buehler</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <comment>SciAgents: automating scientific discovery through multi-agent intelligent graph reasoning. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2409.05556. <uri xlink:href="https://doi.org/10.48550/arXiv.2409.05556">https://doi.org/10.48550/arXiv.2409.05556</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B122">
        <label>122</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hawizy</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Jessop</surname>
              <given-names>DM</given-names>
            </name>
            <name>
              <surname>Adams</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Murray-Rust</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>ChemicalTagger: a tool for semantic text-mining in chemistry</article-title>
          <source>J Cheminform</source>
          <year>2011</year>
          <volume>3</volume>
          <fpage>17</fpage>
          <pub-id pub-id-type="doi">10.1186/1758-2946-3-17</pub-id>
          <pub-id pub-id-type="pmid">21575201</pub-id>
          <pub-id pub-id-type="pmcid">PMC3117806</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B123">
        <label>123</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Swain</surname>
              <given-names>MC</given-names>
            </name>
            <name>
              <surname>Cole</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>ChemDataExtractor: a toolkit for automated extraction of chemical information from the scientific literature</article-title>
          <source>J Chem Inf Model</source>
          <year>2016</year>
          <volume>56</volume>
          <fpage>1894</fpage>
          <lpage>904</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jcim.6b00207</pub-id>
          <pub-id pub-id-type="pmid">27669338</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B124">
        <label>124</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kumar</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Kabra</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Cole</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>A database of stress-strain properties auto-generated from the scientific literature using ChemDataExtractor</article-title>
          <source>Sci Data</source>
          <year>2024</year>
          <volume>11</volume>
          <fpage>1273</fpage>
          <pub-id pub-id-type="doi">10.1038/s41597-024-03979-6</pub-id>
          <pub-id pub-id-type="pmid">39580441</pub-id>
          <pub-id pub-id-type="pmcid">PMC11585639</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B125">
        <label>125</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tshitoyan</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Dagdelen</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Weston</surname>
              <given-names>L</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Unsupervised word embeddings capture latent knowledge from materials science literature</article-title>
          <source>Nature</source>
          <year>2019</year>
          <volume>571</volume>
          <fpage>95</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-019-1335-8</pub-id>
          <pub-id pub-id-type="pmid">31270483</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B126">
        <label>126</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Weston</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Tshitoyan</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Dagdelen</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Named entity recognition and normalization applied to large-scale information extraction from the materials science literature</article-title>
          <source>J Chem Inf Model</source>
          <year>2019</year>
          <volume>59</volume>
          <fpage>3692</fpage>
          <lpage>702</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jcim.9b00470</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B127">
        <label>127</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Tian</surname>
              <given-names>S</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Alloy synthesis and processing by semi-supervised text mining</article-title>
          <source>npj Comput Mater</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>183</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-023-01138-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B128">
        <label>128</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A literature-mining method of integrating text and table extraction for materials science publications</article-title>
          <source>Comput Mater Sci</source>
          <year>2023</year>
          <volume>230</volume>
          <fpage>112441</fpage>
          <pub-id pub-id-type="doi">10.1016/j.commatsci.2023.112441</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B129">
        <label>129</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>An</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Greenberg</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Kalinowski</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Knowledge graph question answering for materials science (KGQA4MAT): developing natural language interface for metal-organic frameworks knowledge graph (MOF-KG) using LLM. <italic>arXiv</italic> <bold>2023</bold>, arXiv:2309.11361. <uri xlink:href="https://doi.org/10.48550/arXiv.2309.11361">https://doi.org/10.48550/arXiv.2309.11361</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B130">
        <label>130</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Dagdelen</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Dunn</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Structured information extraction from complex scientific text with fine-tuned large language models</article-title>
          <source>Nat Commun</source>
          <year>2024</year>
          <volume>15</volume>
          <fpage>1418</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-024-45563-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B131">
        <label>131</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yi</surname>
              <given-names>GH</given-names>
            </name>
            <name>
              <surname>Choi</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Song</surname>
              <given-names>H</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>MaTableGPT: GPT‐based table data extractor from materials science literature</article-title>
          <source>Adv Sci</source>
          <year>2025</year>
          <volume>12</volume>
          <fpage>2408221</fpage>
          <pub-id pub-id-type="doi">10.1002/advs.202408221</pub-id>
          <pub-id pub-id-type="pmid">39853928</pub-id>
          <pub-id pub-id-type="pmcid">PMC12021050</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B132">
        <label>132</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>da Silva</surname>
              <given-names>VT</given-names>
            </name>
            <name>
              <surname>Rademaker</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Lionti</surname>
              <given-names>K</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Automated, LLM enabled extraction of synthesis details for reticular materials from scientific literature. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2411.03484. <uri xlink:href="https://doi.org/10.48550/arXiv.2411.03484">https://doi.org/10.48550/arXiv.2411.03484</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B133">
        <label>133</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Miret</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <comment>HoneyBee: progressive instruction finetuning of large language models for materials science. <italic>arXiv</italic> <bold>2023</bold>, arXiv:2310.08511. <uri xlink:href="https://doi.org/10.48550/arXiv.2310.08511">https://doi.org/10.48550/arXiv.2310.08511</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B134">
        <label>134</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Downey</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Ji</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Hope</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <comment>SciMON: scientific inspiration machines optimized for novelty. In <italic>Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</italic>; 2024 Jul; Bangkok, Thailand. Association for Computational Linguistics; 2024. pp. 279-99.</comment>
          <pub-id pub-id-type="doi">10.18653/v1/2024.acl-long.18</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B135">
        <label>135</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Lai</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Pu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <comment>PriM: principle-inspired material discovery through multi-agent collaboration. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2504.08810. <uri xlink:href="https://doi.org/10.48550/arXiv.2504.08810">https://doi.org/10.48550/arXiv.2504.08810</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B136">
        <label>136</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>MacLeod</surname>
              <given-names>BP</given-names>
            </name>
            <name>
              <surname>Parlane</surname>
              <given-names>FGL</given-names>
            </name>
            <name>
              <surname>Morrissey</surname>
              <given-names>TD</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Self-driving laboratory for accelerated discovery of thin-film materials</article-title>
          <source>Sci Adv</source>
          <year>2020</year>
          <volume>6</volume>
          <fpage>eaaz8867</fpage>
          <pub-id pub-id-type="doi">10.1126/sciadv.aaz8867</pub-id>
          <pub-id pub-id-type="pmid">32426501</pub-id>
          <pub-id pub-id-type="pmcid">PMC7220369</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B137">
        <label>137</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Boyar</surname>
              <given-names>O</given-names>
            </name>
            <name>
              <surname>Priyadarsini</surname>
              <given-names>I</given-names>
            </name>
            <name>
              <surname>Takeda</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Hamada</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <comment>LLM-fusion: a novel multimodal fusion model for accelerated material discovery. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2503.01022. <uri xlink:href="https://doi.org/10.48550/arXiv.2503.01022">https://doi.org/10.48550/arXiv.2503.01022</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B138">
        <label>138</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Choudhary</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT Material Explorer: design and implementation of a custom GPT assistant for materials science applications</article-title>
          <source>Integr Mater Manuf Innov</source>
          <year>2025</year>
          <volume>14</volume>
          <fpage>276</fpage>
          <lpage>83</lpage>
          <pub-id pub-id-type="doi">10.1007/s40192-025-00410-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B139">
        <label>139</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>AY</given-names>
            </name>
            <name>
              <surname>Kauwe</surname>
              <given-names>SK</given-names>
            </name>
            <name>
              <surname>Murdock</surname>
              <given-names>RJ</given-names>
            </name>
            <name>
              <surname>Sparks</surname>
              <given-names>TD</given-names>
            </name>
          </person-group>
          <article-title>Compositionally restricted attention-based network for materials property predictions</article-title>
          <source>npj Comput Mater</source>
          <year>2021</year>
          <volume>7</volume>
          <fpage>77</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-021-00545-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B140">
        <label>140</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jha</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Ward</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Paul</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>ElemNet: deep learning the chemistry of materials from only elemental composition</article-title>
          <source>Sci Rep</source>
          <year>2018</year>
          <volume>8</volume>
          <fpage>17593</fpage>
          <pub-id pub-id-type="doi">10.1038/s41598-018-35934-y</pub-id>
          <pub-id pub-id-type="pmid">30514926</pub-id>
          <pub-id pub-id-type="pmcid">PMC6279928</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B141">
        <label>141</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Goodall</surname>
              <given-names>REA</given-names>
            </name>
            <name>
              <surname>Lee</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Predicting materials properties without crystal structure: deep representation learning from stoichiometry</article-title>
          <source>Nat Commun</source>
          <year>2020</year>
          <volume>11</volume>
          <fpage>6280</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-020-19964-7</pub-id>
          <pub-id pub-id-type="pmid">33293567</pub-id>
          <pub-id pub-id-type="pmcid">PMC7722901</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B142">
        <label>142</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Ouyang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <comment>MoMa: a modular deep learning framework for material property prediction. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2502.15483. <uri xlink:href="https://doi.org/10.48550/arXiv.2502.15483">https://doi.org/10.48550/arXiv.2502.15483</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B143">
        <label>143</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Taniai</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Igarashi</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Suzuki</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Crystalformer: infinitely connected attention for periodic structure encoding. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2403.11686. <uri xlink:href="https://doi.org/10.48550/arXiv.2403.11686">https://doi.org/10.48550/arXiv.2403.11686</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B144">
        <label>144</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Choudhary</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>DeCost</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Atomistic line graph neural network for improved materials property predictions</article-title>
          <source>npj Comput Mater</source>
          <year>2021</year>
          <volume>7</volume>
          <fpage>185</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-021-00650-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B145">
        <label>145</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xie</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Grossman</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Crystal graph convolutional neural networks for an accurate and interpretable prediction of material properties</article-title>
          <source>Phys Rev Lett</source>
          <year>2018</year>
          <volume>120</volume>
          <fpage>145301</fpage>
          <pub-id pub-id-type="doi">10.1103/physrevlett.120.145301</pub-id>
          <pub-id pub-id-type="pmid">29694125</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B146">
        <label>146</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yan</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Ji</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <comment>Periodic graph transformers for crystal material property prediction. <italic>arXiv</italic> <bold>2022</bold>, arXiv:2209.11807. <uri xlink:href="https://doi.org/10.48550/arXiv.2209.11807">https://doi.org/10.48550/arXiv.2209.11807</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B147">
        <label>147</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Nouira</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Sokolovska</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Crivello</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <comment>CrystalGAN: learning to discover crystallographic structures with generative adversarial networks. <italic>arXiv</italic> <bold>2018</bold>, arXiv:1810.11203. <uri xlink:href="https://doi.org/10.48550/arXiv.1810.11203">https://doi.org/10.48550/arXiv.1810.11203</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B148">
        <label>148</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bagal</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Aggarwal</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Vinod</surname>
              <given-names>PK</given-names>
            </name>
            <name>
              <surname>Priyakumar</surname>
              <given-names>UD</given-names>
            </name>
          </person-group>
          <article-title>MolGPT: molecular generation using a transformer-decoder model</article-title>
          <source>J Chem Inf Model</source>
          <year>2022</year>
          <volume>62</volume>
          <fpage>2064</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jcim.1c00600</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B149">
        <label>149</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Cao</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Jiao</surname>
              <given-names>R</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Materials generation in the era of artificial intelligence: a comprehensive survey. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2505.16379. <uri xlink:href="https://doi.org/10.48550/arXiv.2505.16379">https://doi.org/10.48550/arXiv.2505.16379</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B150">
        <label>150</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Xu</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Desai</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Hope</surname>
              <given-names>G</given-names>
            </name>
            <name>
              <surname>Ritz</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <comment>PLaID++: a preference aligned language model for targeted inorganic materials design. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2509.07150. <uri xlink:href="https://doi.org/10.48550/arXiv.2509.07150">https://doi.org/10.48550/arXiv.2509.07150</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B151">
        <label>151</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zeni</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Pinsler</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Zügner</surname>
              <given-names>D</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A generative model for inorganic materials design</article-title>
          <source>Nature</source>
          <year>2025</year>
          <volume>639</volume>
          <fpage>624</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-025-08628-5</pub-id>
          <pub-id pub-id-type="pmid">39821164</pub-id>
          <pub-id pub-id-type="pmcid">PMC11922738</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B152">
        <label>152</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Karpovich</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Pan</surname>
              <given-names>E</given-names>
            </name>
            <name>
              <surname>Olivetti</surname>
              <given-names>EA</given-names>
            </name>
          </person-group>
          <article-title>Deep reinforcement learning for inverse inorganic materials design</article-title>
          <source>npj Comput Mater</source>
          <year>2024</year>
          <volume>10</volume>
          <fpage>287</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-024-01474-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B153">
        <label>153</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cleeton</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Sarkisov</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Inverse design of metal-organic frameworks using deep dreaming approaches</article-title>
          <source>Nat Commun</source>
          <year>2025</year>
          <volume>16</volume>
          <fpage>4806</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-025-59952-3</pub-id>
          <pub-id pub-id-type="pmid">40410161</pub-id>
          <pub-id pub-id-type="pmcid">PMC12102185</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B154">
        <label>154</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zuo</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Qin</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Accelerating materials discovery with Bayesian optimization and graph deep learning</article-title>
          <source>Mater Today</source>
          <year>2021</year>
          <volume>51</volume>
          <fpage>126</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1016/j.mattod.2021.08.012</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B155">
        <label>155</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Xing</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Ji</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <comment>Code-generated graph representations using multiple LLM agents for material properties prediction. In <italic>Proceedings of the 42nd International Conference on Machine Learning</italic>. PMLR; 2025. pp. 25972-86. <uri xlink:href="https://proceedings.mlr.press/v267/huang25an.html">https://proceedings.mlr.press/v267/huang25an.html</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B156">
        <label>156</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Ghafarollahi</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Buehler</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <comment>Autonomous inorganic materials discovery via multi-agent physics-aware scientific reasoning. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2508.02956. <uri xlink:href="https://doi.org/10.48550/arXiv.2508.02956">https://doi.org/10.48550/arXiv.2508.02956</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B157">
        <label>157</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Larsen</surname>
              <given-names>AH</given-names>
            </name>
            <name>
              <surname>Mortensen</surname>
              <given-names>JJ</given-names>
            </name>
            <name>
              <surname>Blomqvist</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>The atomic simulation environment - a Python library for working with atoms</article-title>
          <source>J Phys Condens Matter</source>
          <year>2017</year>
          <volume>29</volume>
          <fpage>273002</fpage>
          <pub-id pub-id-type="doi">10.1088/1361-648x/aa680e</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B158">
        <label>158</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Chandrasekhar</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Farimani</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <comment>Automating MD simulations for proteins using large language models: NAMD-agent. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2507.07887. <uri xlink:href="https://doi.org/10.48550/arXiv.2507.07887">https://doi.org/10.48550/arXiv.2507.07887</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B159">
        <label>159</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>H</given-names>
            </name>
            <etal />
          </person-group>
          <comment>DREAMS: density functional theory based research engine for agentic materials simulation. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2507.14267. <uri xlink:href="https://doi.org/10.48550/arXiv.2507.14267">https://doi.org/10.48550/arXiv.2507.14267</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B160">
        <label>160</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Deng</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Zhong</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Jun</surname>
              <given-names>K</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>CHGNet as a pretrained universal neural network potential for charge-informed atomistic modelling</article-title>
          <source>Nat Mach Intell</source>
          <year>2023</year>
          <volume>5</volume>
          <fpage>1031</fpage>
          <lpage>41</lpage>
          <pub-id pub-id-type="doi">10.1038/s42256-023-00716-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B161">
        <label>161</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Batzner</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Musaelian</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>L</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>E(3)-equivariant graph neural networks for data-efficient and accurate interatomic potentials</article-title>
          <source>Nat Commun</source>
          <year>2022</year>
          <volume>13</volume>
          <fpage>2453</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-022-29939-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B162">
        <label>162</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Musaelian</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Batzner</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Johansson</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Learning local equivariant representations for large-scale atomistic dynamics</article-title>
          <source>Nat Commun</source>
          <year>2023</year>
          <volume>14</volume>
          <fpage>579</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-023-36329-y</pub-id>
          <pub-id pub-id-type="pmid">36737620</pub-id>
          <pub-id pub-id-type="pmcid">PMC9898554</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B163">
        <label>163</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>DPA-2: a large atomic model as a multi-task learner</article-title>
          <source>npj Comput Mater</source>
          <year>2024</year>
          <volume>10</volume>
          <fpage>293</fpage>
          <pub-id pub-id-type="doi">10.1038/s41524-024-01493-2</pub-id>
          <pub-id pub-id-type="pmid">40851785</pub-id>
          <pub-id pub-id-type="pmcid">PMC12369844</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B164">
        <label>164</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Batatia</surname>
              <given-names>I</given-names>
            </name>
            <name>
              <surname>Benner</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Chiang</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A foundation model for atomistic materials chemistry</article-title>
          <source>J Chem Phys</source>
          <year>2025</year>
          <volume>163</volume>
          <fpage>184110</fpage>
          <pub-id pub-id-type="doi">10.1063/5.0297006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B165">
        <label>165</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <comment>MatterSim: a deep learning atomistic model across elements, temperatures and pressures. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2405.04967. <uri xlink:href="https://doi.org/10.48550/arXiv.2405.04967">https://doi.org/10.48550/arXiv.2405.04967</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B166">
        <label>166</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Ong</surname>
              <given-names>SP</given-names>
            </name>
          </person-group>
          <article-title>A universal graph deep learning interatomic potential for the periodic table</article-title>
          <source>Nat Comput Sci</source>
          <year>2022</year>
          <volume>2</volume>
          <fpage>718</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1038/s43588-022-00349-3</pub-id>
          <pub-id pub-id-type="pmid">38177366</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B167">
        <label>167</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Bazant</surname>
              <given-names>MZ</given-names>
            </name>
            <name>
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Phase-Field DeepONet: physics-informed deep operator neural network for fast simulations of pattern formation governed by gradient flows of free-energy functionals</article-title>
          <source>Comput Methods Appl Mech Eng</source>
          <year>2023</year>
          <volume>416</volume>
          <fpage>116299</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cma.2023.116299</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B168">
        <label>168</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Haghighat</surname>
              <given-names>E</given-names>
            </name>
            <name>
              <surname>Raissi</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Moure</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Gomez</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Juanes</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A physics-informed deep learning framework for inversion and surrogate modeling in solid mechanics</article-title>
          <source>Comput Methods Appl Mech Eng</source>
          <year>2021</year>
          <volume>379</volume>
          <fpage>113741</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cma.2021.113741</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B169">
        <label>169</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Campbell</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Cox</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Medina</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Watterson</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>White</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <comment>MDCrow: automating molecular dynamics workflows with large language models. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2502.09565. <uri xlink:href="https://doi.org/10.48550/arXiv.2502.09565">https://doi.org/10.48550/arXiv.2502.09565</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B170">
        <label>170</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Shi</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Xin</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Huo</surname>
              <given-names>T</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A fine-tuned large language model based molecular dynamics agent for code generation to obtain material thermodynamic parameters</article-title>
          <source>Sci Rep</source>
          <year>2025</year>
          <volume>15</volume>
          <fpage>10295</fpage>
          <pub-id pub-id-type="doi">10.1038/s41598-025-92337-6</pub-id>
          <pub-id pub-id-type="pmid">40133325</pub-id>
          <pub-id pub-id-type="pmcid">PMC11937566</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B171">
        <label>171</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zou</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Cheng</surname>
              <given-names>AH</given-names>
            </name>
            <name>
              <surname>Aldossary</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>El Agente: an autonomous agent for quantum chemistry</article-title>
          <source>Matter</source>
          <year>2025</year>
          <volume>8</volume>
          <fpage>102263</fpage>
          <pub-id pub-id-type="doi">10.1016/j.matt.2025.102263</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B172">
        <label>172</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Xin</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Jiao</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <comment>MooseAgent: a LLM based multi-agent framework for automating MOOSE simulation. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2504.08621. <uri xlink:href="https://doi.org/10.48550/arXiv.2504.08621">https://doi.org/10.48550/arXiv.2504.08621</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B173">
        <label>173</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Ghafarollahi</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Buehler</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <comment>AtomAgents: alloy design and discovery through physics-aware multi-modal multi-agent artificial intelligence. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2407.10022. <uri xlink:href="https://doi.org/10.48550/arXiv.2407.10022">https://doi.org/10.48550/arXiv.2407.10022</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B174">
        <label>174</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Chaudhari</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Ock</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Barati Farimani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Modular large language model agents for multi-task computational materials science</article-title>
          <source>Commun Mater</source>
          <year>2026</year>
          <volume>7</volume>
          <fpage>131</fpage>
          <pub-id pub-id-type="doi">10.1038/s43246-025-00994-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B175">
        <label>175</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Gottweis</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Weng</surname>
              <given-names>WH</given-names>
            </name>
            <name>
              <surname>Daryin</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Towards an AI co-scientist. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2502.18864. <uri xlink:href="https://doi.org/10.48550/arXiv.2502.18864">https://doi.org/10.48550/arXiv.2502.18864</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B176">
        <label>176</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Abolhasani</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Kumacheva</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The rise of self-driving labs in chemical and materials sciences</article-title>
          <source>Nat Synth</source>
          <year>2023</year>
          <volume>2</volume>
          <fpage>483</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.1038/s44160-022-00231-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B177">
        <label>177</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Guha</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Mullick</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Agrawal</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>MatScIE: an automated tool for the generation of databases of methods and parameters used in the computational materials science literature</article-title>
          <source>Comput Mater Sci</source>
          <year>2021</year>
          <volume>192</volume>
          <fpage>110325</fpage>
          <pub-id pub-id-type="doi">10.1016/j.commatsci.2021.110325</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B178">
        <label>178</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Stricker</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>MatNexus: a comprehensive text mining and analysis suite for materials discovery</article-title>
          <source>SoftwareX</source>
          <year>2024</year>
          <volume>26</volume>
          <fpage>101654</fpage>
          <pub-id pub-id-type="doi">10.1016/j.softx.2024.101654</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B179">
        <label>179</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jalali</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Caulfield</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Sauter</surname>
              <given-names>E</given-names>
            </name>
            <name>
              <surname>Nefedov</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Wöll</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Large language models in electronic laboratory notebooks: transforming materials science research workflows</article-title>
          <source>Mater Today Commun</source>
          <year>2024</year>
          <volume>40</volume>
          <fpage>109801</fpage>
          <pub-id pub-id-type="doi">10.1016/j.mtcomm.2024.109801</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B180">
        <label>180</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>He</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Huo</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Bartel</surname>
              <given-names>CJ</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Cruse</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Ceder</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Precursor recommendation for inorganic synthesis by machine learning materials similarity from scientific literature</article-title>
          <source>Sci Adv</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>eadg8180</fpage>
          <pub-id pub-id-type="doi">10.1126/sciadv.adg8180</pub-id>
          <pub-id pub-id-type="pmid">37294767</pub-id>
          <pub-id pub-id-type="pmcid">PMC10256153</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B181">
        <label>181</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>O</given-names>
            </name>
            <name>
              <surname>Nguyen</surname>
              <given-names>HL</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>ChatGPT research group for optimizing the crystallinity of MOFs and COFs</article-title>
          <source>ACS Cent Sci</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>2161</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1021/acscentsci.3c01087</pub-id>
          <pub-id pub-id-type="pmid">38033801</pub-id>
          <pub-id pub-id-type="pmcid">PMC10683477</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B182">
        <label>182</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Cissé</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Evangelopoulos</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Gusev</surname>
              <given-names>VV</given-names>
            </name>
            <name>
              <surname>Cooper</surname>
              <given-names>AI</given-names>
            </name>
          </person-group>
          <comment>Language-based Bayesian optimization research assistant (BORA). In <italic>Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence</italic>, Aug 16-22, 2025; Montreal, Canada. California: International Joint Conferences on Artificial Intelligence Organization; 2025. pp. 4967-75.</comment>
          <pub-id pub-id-type="doi">10.24963/ijcai.2025/553</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B183">
        <label>183</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Astorga</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Seedat</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>van der Schaar</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <comment>Large language models to enhance Bayesian optimization. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2402.03921. <uri xlink:href="https://doi.org/10.48550/arXiv.2402.03921">https://doi.org/10.48550/arXiv.2402.03921</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B184">
        <label>184</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Chang</surname>
              <given-names>CY</given-names>
            </name>
            <name>
              <surname>Azvar</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Okwudire</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Kontar</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <comment>LLINBO: trustworthy LLM-in-the-loop Bayesian optimization. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2505.14756. <uri xlink:href="https://doi.org/10.48550/arXiv.2505.14756">https://doi.org/10.48550/arXiv.2505.14756</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B185">
        <label>185</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Ge</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Fu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <comment>Reasoning BO: enhancing Bayesian optimization with long-context reasoning power of LLMs. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2505.12833. <uri xlink:href="https://doi.org/10.48550/arXiv.2505.12833">https://doi.org/10.48550/arXiv.2505.12833</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B186">
        <label>186</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Guo</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Guo</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Nan</surname>
              <given-names>B</given-names>
            </name>
            <etal />
          </person-group>
          <comment>What can large language models do in chemistry? A comprehensive benchmark on eight tasks. <italic>arXiv</italic> <bold>2023</bold>, arXiv:2305.18365. <uri xlink:href="https://doi.org/10.48550/arXiv.2305.18365">https://doi.org/10.48550/arXiv.2305.18365</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B187">
        <label>187</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>W</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>MaterialBrain: high-performance material synthesis extraction via human–AI-curated few-shot large language models</article-title>
          <source>J Chem Inf Model</source>
          <year>2025</year>
          <volume>66</volume>
          <fpage>228</fpage>
          <lpage>45</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jcim.5c02299</pub-id>
          <pub-id pub-id-type="pmid">41449076</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B188">
        <label>188</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>McDermott</surname>
              <given-names>MJ</given-names>
            </name>
            <name>
              <surname>Dwaraknath</surname>
              <given-names>SS</given-names>
            </name>
            <name>
              <surname>Persson</surname>
              <given-names>KA</given-names>
            </name>
          </person-group>
          <article-title>A graph-based network for predicting chemical reaction pathways in solid-state materials synthesis</article-title>
          <source>Nat Commun</source>
          <year>2021</year>
          <volume>12</volume>
          <fpage>3097</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-021-23339-x</pub-id>
          <pub-id pub-id-type="pmid">34035255</pub-id>
          <pub-id pub-id-type="pmcid">PMC8149458</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B189">
        <label>189</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Qu</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Yin</surname>
              <given-names>M</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>CRISPR-GPT for agentic automation of gene-editing experiments</article-title>
          <source>Nat Biomed Eng</source>
          <year>2025</year>
          <volume>10</volume>
          <fpage>245</fpage>
          <lpage>58</lpage>
          <pub-id pub-id-type="doi">10.1038/s41551-025-01463-z</pub-id>
          <pub-id pub-id-type="pmid">40738974</pub-id>
          <pub-id pub-id-type="pmcid">PMC12920143</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B190">
        <label>190</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Acharya</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Sharma</surname>
              <given-names>AK</given-names>
            </name>
            <name>
              <surname>Parker</surname>
              <given-names>D</given-names>
            </name>
            <etal />
          </person-group>
          <comment>LABMATE: language model based multi-agent system to accelerate catalysis experiments. In <italic>Proceedings of the SC '25 Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis, Association for Computing Machinery</italic>; 2025. pp. 607-15.</comment>
          <pub-id pub-id-type="doi">10.1145/3731599.3767399</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B191">
        <label>191</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Sarkar</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Collective intelligence for AI-assisted chemical synthesis</article-title>
          <source>Nature</source>
          <year>2026</year>
          <volume>651</volume>
          <fpage>107</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-026-10131-4</pub-id>
          <pub-id pub-id-type="pmid">41554982</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B192">
        <label>192</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fan</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>AutoMEX: streamlining material extrusion with AI agents powered by large language models and knowledge graphs</article-title>
          <source>Mater Design</source>
          <year>2025</year>
          <volume>251</volume>
          <fpage>113644</fpage>
          <pub-id pub-id-type="doi">10.1016/j.matdes.2025.113644</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B193">
        <label>193</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tao</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Kheiri</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Aldeghi</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Aspuru-Guzik</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Kumacheva</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Self‐driving platform for metal nanoparticle synthesis: combining microfluidics and machine learning</article-title>
          <source>Adv Funct Mater</source>
          <year>2021</year>
          <volume>31</volume>
          <fpage>2106725</fpage>
          <pub-id pub-id-type="doi">10.1002/adfm.202106725</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B194">
        <label>194</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sadeghi</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Bateni</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>T</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Autonomous nanomanufacturing of lead-free metal halide perovskite nanocrystals using a self-driving fluidic lab</article-title>
          <source>Nanoscale</source>
          <year>2024</year>
          <volume>16</volume>
          <fpage>580</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1039/d3nr05034c</pub-id>
          <pub-id pub-id-type="pmid">38116636</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B195">
        <label>195</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Burger</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Maffettone</surname>
              <given-names>PM</given-names>
            </name>
            <name>
              <surname>Gusev</surname>
              <given-names>VV</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A mobile robotic chemist</article-title>
          <source>Nature</source>
          <year>2020</year>
          <volume>583</volume>
          <fpage>237</fpage>
          <lpage>41</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-020-2442-2</pub-id>
          <pub-id pub-id-type="pmid">32641813</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B196">
        <label>196</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hysmith</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Foadian</surname>
              <given-names>E</given-names>
            </name>
            <name>
              <surname>Padhy</surname>
              <given-names>SP</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>The future of self-driving laboratories: from human in the loop interactive AI to gamification</article-title>
          <source>Digital Discov</source>
          <year>2024</year>
          <volume>3</volume>
          <fpage>621</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1039/d4dd00040d</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B197">
        <label>197</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Weng</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Gao</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Zhu</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <comment>MatQnA: a benchmark dataset for multi-modal large language models in materials characterization and analysis. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2509.11335. <uri xlink:href="https://doi.org/10.48550/arXiv.2509.11335">https://doi.org/10.48550/arXiv.2509.11335</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B198">
        <label>198</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Guo</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Huo</surname>
              <given-names>P</given-names>
            </name>
            <etal />
          </person-group>
          <comment>S1-MMAlign: a large-scale, multi-disciplinary dataset for scientific figure-text understanding. <italic>arXiv</italic> <bold>2026</bold>, arXiv:2601.00264. <uri xlink:href="https://doi.org/10.48550/arXiv.2601.00264">https://doi.org/10.48550/arXiv.2601.00264</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B199">
        <label>199</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Botifoll</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Pinto-Huguet</surname>
              <given-names>I</given-names>
            </name>
            <name>
              <surname>Rotunno</surname>
              <given-names>E</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Artificial intelligence‐assisted workflow for transmission electron microscopy: from data analysis automation to materials knowledge unveiling</article-title>
          <source>Adv Mater</source>
          <year>2025</year>
          <fpage>e06785</fpage>
          <pub-id pub-id-type="doi">10.1002/adma.202506785</pub-id>
          <pub-id pub-id-type="pmid">41122804</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B200">
        <label>200</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Davel</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Bassiri-Gharb</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Correa-Baena</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in X-ray diffraction for materials discovery and characterization</article-title>
          <source>Matter</source>
          <year>2025</year>
          <volume>8</volume>
          <fpage>102272</fpage>
          <pub-id pub-id-type="doi">10.1016/j.matt.2025.102272</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B201">
        <label>201</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cao</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>XQueryer: an intelligent crystal structure identifier for powder X-ray diffraction</article-title>
          <source>Natl Sci Rev</source>
          <year>2025</year>
          <volume>12</volume>
          <fpage>nwaf421</fpage>
          <pub-id pub-id-type="doi">10.1093/nsr/nwaf421</pub-id>
          <pub-id pub-id-type="pmid">41293600</pub-id>
          <pub-id pub-id-type="pmcid">PMC12641137</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B202">
        <label>202</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Han</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Yao</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Ban</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <comment>MatSAM: efficient extraction of microstructures of materials via visual large model. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2401.05638. <uri xlink:href="https://doi.org/10.48550/arXiv.2401.05638">https://doi.org/10.48550/arXiv.2401.05638</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B203">
        <label>203</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Anker</surname>
              <given-names>AS</given-names>
            </name>
            <name>
              <surname>Butler</surname>
              <given-names>KT</given-names>
            </name>
            <name>
              <surname>Selvan</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Jensen</surname>
              <given-names>KMØ</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for analysis of experimental scattering and spectroscopy data in materials chemistry</article-title>
          <source>Chem Sci</source>
          <year>2023</year>
          <volume>14</volume>
          <fpage>14003</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1039/d3sc05081e</pub-id>
          <pub-id pub-id-type="pmid">38098730</pub-id>
          <pub-id pub-id-type="pmcid">PMC10718081</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B204">
        <label>204</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Choudhary</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>MicroscopyGPT: generating atomic-structure captions from microscopy images of 2D materials with vision-language transformers</article-title>
          <source>J Phys Chem Lett</source>
          <year>2025</year>
          <volume>16</volume>
          <fpage>7028</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.jpclett.5c01257</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B205">
        <label>205</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Ahmed</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <comment>A large-language-model assisted automated scale bar detection and extraction framework for scanning electron microscopic images. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2510.11260. <uri xlink:href="https://doi.org/10.48550/arXiv.2510.11260">https://doi.org/10.48550/arXiv.2510.11260</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B206">
        <label>206</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fei</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>McDermott</surname>
              <given-names>MJ</given-names>
            </name>
            <name>
              <surname>Rom</surname>
              <given-names>CL</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Ceder</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Dara: automated multiple-hypothesis phase identification and refinement from powder X-ray diffraction</article-title>
          <source>Chem Mater</source>
          <year>2026</year>
          <volume>38</volume>
          <fpage>1364</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1021/acs.chemmater.5c02820</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B207">
        <label>207</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Bazgir</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <comment>Drug discovery agent: an automated vision detection system for drug-cell interactions. In <italic>IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops</italic>, CVPR Workshops 2025, 2025; pp. 4308-16. <uri xlink:href="https://openaccess.thecvf.com/content/CVPR2025W/CVDD/html/Bazgir_Drug_Discovery_Agent_An_Automated_Vision_Detection_System_for_Drug-Cell_CVPRW_2025_paper.html">https://openaccess.thecvf.com/content/CVPR2025W/CVDD/html/Bazgir_Drug_Discovery_Agent_An_Automated_Vision_Detection_System_for_Drug-Cell_CVPRW_2025_paper.html</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B208">
        <label>208</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Bazgir</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <comment>MatAgent: a human-in-the-loop multi-agent LLM framework for accelerating the material science discovery cycle. In <italic>AI for Accelerated Materials Design-ICLR 2025</italic>, 2025. <uri xlink:href="https://openreview.net/pdf/7c4f3b61beb01e7f4740671b78cd1f777bd0e60a.pdf">https://openreview.net/pdf/7c4f3b61beb01e7f4740671b78cd1f777bd0e60a.pdf</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B209">
        <label>209</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yao</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Samantray</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Ghosh</surname>
              <given-names>A</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Operationalizing serendipity: multi-agent AI workflows for enhanced materials characterization with theory-in-the-loop. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2508.06569. <uri xlink:href="https://doi.org/10.48550/arXiv.2508.06569">https://doi.org/10.48550/arXiv.2508.06569</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B210">
        <label>210</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <comment>AutoMat: enabling automated crystal structure reconstruction from microscopy via agentic tool use. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2505.12650. <uri xlink:href="https://doi.org/10.48550/arXiv.2505.12650">https://doi.org/10.48550/arXiv.2505.12650</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B211">
        <label>211</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Noh</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Lee</surname>
              <given-names>N</given-names>
            </name>
            <name>
              <surname>Na</surname>
              <given-names>GS</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Park</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <comment>IR-agent: expert-inspired LLM agents for structure elucidation from infrared spectra. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2508.16112. <uri xlink:href="https://doi.org/10.48550/arXiv.2508.16112">https://doi.org/10.48550/arXiv.2508.16112</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B212">
        <label>212</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Mandal</surname>
              <given-names>I</given-names>
            </name>
            <name>
              <surname>Soni</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Zaki</surname>
              <given-names>M</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Evaluating large language model agents for automation of atomic force microscopy</article-title>
          <source>Nat Commun</source>
          <year>2025</year>
          <volume>16</volume>
          <fpage>9104</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-025-64105-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B213">
        <label>213</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Darvish</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Skreta</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>ORGANA: a robotic assistant for automated chemistry experimentation and characterization</article-title>
          <source>Matter</source>
          <year>2025</year>
          <volume>8</volume>
          <fpage>101897</fpage>
          <pub-id pub-id-type="doi">10.1016/j.matt.2024.10.015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B214">
        <label>214</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Jia</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Fung</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <comment>LLMatDesign: autonomous materials discovery with large language models. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2406.13163. <uri xlink:href="https://doi.org/10.48550/arXiv.2406.13163">https://doi.org/10.48550/arXiv.2406.13163</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B215">
        <label>215</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Nikolaev</surname>
              <given-names>P</given-names>
            </name>
            <name>
              <surname>Hooper</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Webber</surname>
              <given-names>F</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Autonomy in materials research: a case study in carbon nanotube growth</article-title>
          <source>npj Comput Mater</source>
          <year>2016</year>
          <volume>2</volume>
          <fpage>16031</fpage>
          <pub-id pub-id-type="doi">10.1038/npjcompumats.2016.31</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B216">
        <label>216</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ye</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Yuan</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Fu</surname>
              <given-names>P</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>A full-process artificial intelligence framework for perovskite solar cells</article-title>
          <source>Sci China Mater</source>
          <year>2025</year>
          <volume>68</volume>
          <fpage>2526</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1007/s40843-025-3416-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B217">
        <label>217</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ruan</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Lu</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>N</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>An automatic end-to-end chemical synthesis development platform powered by large language models</article-title>
          <source>Nat Commun</source>
          <year>2024</year>
          <volume>15</volume>
          <fpage>10160</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-024-54457-x</pub-id>
          <pub-id pub-id-type="pmid">39580482</pub-id>
          <pub-id pub-id-type="pmcid">PMC11585555</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B218">
        <label>218</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Jin</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>Q</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <comment>TopoMAS: large language model driven topological materials multiagent system. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2507.04053. <uri xlink:href="https://doi.org/10.48550/arXiv.2507.04053">https://doi.org/10.48550/arXiv.2507.04053</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B219">
        <label>219</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Ely</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Ajith</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Campbell</surname>
              <given-names>CR</given-names>
            </name>
            <name>
              <surname>Choudhary</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <comment>AGAPI-agents: an open-access agentic AI platform for accelerated materials design on AtomGPT.org. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2512.11935. <uri xlink:href="https://doi.org/10.48550/arXiv.2512.11935">https://doi.org/10.48550/arXiv.2512.11935</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B220">
        <label>220</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Shen</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>Unlocking azobenzene isomerization mechanisms <italic>via</italic> an LLM agent-driven workflow integrating simulation, experiment, and machine learning</article-title>
          <source>Chem Sci</source>
          <year>2026</year>
          <pub-id pub-id-type="doi">10.1039/D5SC08794E</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B221">
        <label>221</label>
        <nlm-citation publication-type="book">
          <comment>Juchli, D. SiLA 2: the next generation lab automation standard. In <italic>Smart Biolabs of the Future</italic>, Beutel, S., Lenk, F. Eds.; Springer International Publishing, 2022; pp. 147–74.</comment>
          <pub-id pub-id-type="doi">10.1007/10_2022_204</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B222">
        <label>222</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Roch</surname>
              <given-names>LM</given-names>
            </name>
            <name>
              <surname>Häse</surname>
              <given-names>F</given-names>
            </name>
            <name>
              <surname>Aspuru-Guzik</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <comment>Chapter 16: ChemOS: an orchestration software to democratize autonomous discovery. In: Brown, N.; Editor. <italic>Artificial Intelligence in Drug Discovery</italic>. Cambridge: Royal Society of Chemistry; 2020. pp. 349-88.</comment>
          <pub-id pub-id-type="doi">10.1039/9781788016841-00349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B223">
        <label>223</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Quigley</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Conley</surname>
              <given-names>K</given-names>
            </name>
            <name>
              <surname>Gerkey</surname>
              <given-names>B</given-names>
            </name>
            <etal />
          </person-group>
          <comment>ROS: an open-source Robot Operating System. In <italic>ICRA workshop on open source software</italic>, 2009. <uri xlink:href="http://lars.mec.ua.pt/public/LAR%20Projects/BinPicking/2016_RodrigoSalgueiro/LIB/ROS/icraoss09-ROS.pdf">http://lars.mec.ua.pt/public/LAR%20Projects/BinPicking/2016_RodrigoSalgueiro/LIB/ROS/icraoss09-ROS.pdf</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B224">
        <label>224</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fawzy</surname>
              <given-names>SM</given-names>
            </name>
            <name>
              <surname>M. Ali</surname>
              <given-names>MK</given-names>
            </name>
            <name>
              <surname>Allam</surname>
              <given-names>NK</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence-driven materials design for next-generation sustainable energy technologies</article-title>
          <source>ACS Sustain Chem Eng</source>
          <year>2026</year>
          <volume>14</volume>
          <fpage>4745</fpage>
          <lpage>61</lpage>
          <pub-id pub-id-type="doi">10.1021/acssuschemeng.6c01084</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B225">
        <label>225</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Bouchard</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Chauhan</surname>
              <given-names>MS</given-names>
            </name>
            <name>
              <surname>Skarbrevik</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Ra</surname>
              <given-names>HK</given-names>
            </name>
            <name>
              <surname>Bajaj</surname>
              <given-names>V</given-names>
            </name>
            <name>
              <surname>Ahmad</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <comment>UQLM: a Python package for uncertainty quantification in large language models. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2507.06196. <uri xlink:href="https://doi.org/10.48550/arXiv.2507.06196">https://doi.org/10.48550/arXiv.2507.06196</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B226">
        <label>226</label>
        <nlm-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Krasecki</surname>
              <given-names>VK</given-names>
            </name>
            <name>
              <surname>Sharma</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Cavell</surname>
              <given-names>AC</given-names>
            </name>
            <etal />
          </person-group>
          <article-title>The role of experimental noise in a hybrid classical-molecular computer to solve combinatorial optimization problems</article-title>
          <source>ACS Cent Sci</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>1453</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1021/acscentsci.3c00515</pub-id>
          <pub-id pub-id-type="pmid">37521801</pub-id>
          <pub-id pub-id-type="pmcid">PMC10375572</pub-id>
        </nlm-citation>
      </ref>
      <ref id="B227">
        <label>227</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Choubey</surname>
              <given-names>PK</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>KH</given-names>
            </name>
            <name>
              <surname>Xiong</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>CS</given-names>
            </name>
          </person-group>
          <comment>Agentic uncertainty quantification. <italic>arXiv</italic> <bold>2026</bold>, arXiv:2601.15703. <uri xlink:href="https://doi.org/10.48550/arXiv.2601.15703">https://doi.org/10.48550/arXiv.2601.15703</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B228">
        <label>228</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Bougzime</surname>
              <given-names>O</given-names>
            </name>
            <name>
              <surname>Jabbar</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Cruz</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Demoly</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <comment>Unlocking the potential of generative AI through neuro-symbolic architectures: benefits and limitations. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2502.11269. <uri xlink:href="https://doi.org/10.48550/arXiv.2502.11269">https://doi.org/10.48550/arXiv.2502.11269</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B229">
        <label>229</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Shen</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Xi</surname>
              <given-names>Z</given-names>
            </name>
            <etal />
          </person-group>
          <comment>SciAgentGym: benchmarking multi-step scientific tool-use in LLM agents. <italic>arXiv</italic> <bold>2026</bold>, arXiv:2602.12984. <uri xlink:href="https://doi.org/10.48550/arXiv.2602.12984">https://doi.org/10.48550/arXiv.2602.12984</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B230">
        <label>230</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <etal />
          </person-group>
          <comment>Probing scientific general intelligence of LLMs with scientist-aligned workflows. <italic>arXiv</italic> <bold>2025</bold>, arXiv:2512.16969. <uri xlink:href="https://doi.org/10.48550/arXiv.2512.16969">https://doi.org/10.48550/arXiv.2512.16969</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B231">
        <label>231</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Chaturvedi</surname>
              <given-names>SS</given-names>
            </name>
            <name>
              <surname>Bergerson</surname>
              <given-names>J</given-names>
            </name>
            <name>
              <surname>Mallick</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <comment>Toward reliable, safe, and secure LLMs for scientific applications. <italic>arXiv</italic> <bold>2026</bold>, arXiv:2603.18235. <uri xlink:href="https://doi.org/10.48550/arXiv.2603.18235">https://doi.org/10.48550/arXiv.2603.18235</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
      <ref id="B232">
        <label>232</label>
        <nlm-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Zhao</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>X</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <etal />
          </person-group>
          <comment>ChemSafetyBench: benchmarking LLM safety on chemistry domain. <italic>arXiv</italic> <bold>2024</bold>, arXiv:2411.16736. <uri xlink:href="https://doi.org/10.48550/arXiv.2411.16736">https://doi.org/10.48550/arXiv.2411.16736</uri>. (accessed 2026-05-19)</comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>