h1

h2

h3

h4

h5
h6
% IMPORTANT: The following is UTF-8 encoded.  This means that in the presence
% of non-ASCII characters, it will not work with BibTeX 0.99 or older.
% Instead, you should use an up-to-date BibTeX implementation like “bibtex8” or
% “biber”.

@PHDTHESIS{Ihsan:1018782,
      author       = {Ihsan, Ahmad Zainul},
      othercontributors = {Sandfeld, Stefan and Kerzel, Ulrich Bernd},
      title        = {{E}nabling the digital transformation in materials science
                      and engineering: leveraging ontologies for knowledge
                      representation, provenance, and text mining},
      school       = {Rheinisch-Westfälische Technische Hochschule Aachen},
      type         = {Dissertation},
      address      = {Aachen},
      publisher    = {RWTH Aachen University},
      reportid     = {RWTH-2025-07969},
      pages        = {1 Online-Ressource : Illustrationen},
      year         = {2025},
      note         = {Veröffentlicht auf dem Publikationsserver der RWTH Aachen
                      University; Dissertation, Rheinisch-Westfälische Technische
                      Hochschule Aachen, 2025},
      abstract     = {The digital transformation of Materials Science and
                      Engineering (MSE) is essential for accelerating the
                      development of novel materials and enhancing understanding
                      of the materials life cycle, encompassing raw resources,
                      functional materials, engineered components, and beyond.
                      This transformation entails integrating computational
                      methods, data science, and artificial intelligence (AI) to
                      advance the field of MSE. However, the heterogeneity of data
                      formats, unstructured information, and the reproducibility
                      crisis in MSE pose challenges to the effective management,
                      reuse, and analysis of data. This thesis addresses these
                      challenges by leveraging ontologies as the foundation for
                      semantic data enrichment, facilitating knowledge
                      representation, provenance documentation, and text mining.
                      The first contribution of this work is the development of
                      the Dislocation Ontology (DISO), an ontology that represents
                      the domain knowledge of linear defects in crystalline
                      materials. The development of DISO was driven by the
                      objective of facilitating data interoperability with other
                      MSE-related data. DISO was aligned with the Elementary
                      Multiperspective Material Ontology (EMMO) and Materials
                      Design Ontology (MDO) to ensure interoperability. The
                      ontology alignment efficiently represents the dislocation
                      simulation data. Moreover, we present a real-world use case
                      of representing discrete dislocation dynamics data as a
                      knowledge graph (DisLocKG), which can depict the
                      relationships between them. Additionally, DisLocKG is
                      accessible, as we developed a SPARQL endpoint that offers
                      considerable flexibility when querying DisLocKG. Another
                      contribution of this work is the PRovenance Information for
                      MAterials Science (PRIMA) ontology, which was designed to
                      document provenance information in MSE research, promoting
                      data reliability, trustworthiness, and reproducibility.
                      PRIMA was aligned with the Provenance Ontology (PROV-O) and
                      the Platform Material Digital core ontology (PMDco) and was
                      evaluated through use cases involving metallic biomaterial
                      fabrication and microscopy data. Furthermore, this thesis
                      presents a framework integrating Large Language Models
                      (LLMs) and Semantic Web technologies to extract structured
                      data from unstructured materials synthesis text. Free-text
                      data is transformed into machine-readable formats such as
                      JSON and further enriched semantically using an ontology.
                      The overarching objective of this work is to demonstrate an
                      interdisciplinary approach that integrates MSE knowledge,
                      Semantic Web technologies, and Natural Language Processing
                      (NLP) to facilitate the digital transformation of MSE. The
                      developed ontologies and knowledge graphs are pivotal in
                      data enrichment and interoperability, ensuring that
                      materials data adhere to the FAIR (Findable, Accessible,
                      Interoperable, Reusable) data principles. The LLMs-based
                      text mining framework provides a strategy for handling
                      unstructured data in materials synthesis-related text,
                      enabling the generation of linked data and knowledge
                      extraction. Despite these advances, challenges persist in
                      expanding DISO and DisLocKG to new use cases, refining data
                      models, and improving long-context processing in LLMs.
                      Future works will entail the development of Application
                      Programming Interfaces (APIs) for DisLocKG, extending PRIMA
                      with computational modules, and exploring more efficient
                      LLMs architectures for a more extensive range of text-mining
                      applications. We envision a future where Semantic Web
                      technologies and AI converge to enable machines to extract,
                      process, and understand scientific data, ultimately driving
                      the digital transformation in MSE.},
      cin          = {527210 / 520000},
      ddc          = {620},
      cid          = {$I:(DE-82)527210_20201120$ / $I:(DE-82)520000_20140620$},
      pnm          = {MuDiLingo - A Multiscale Dislocation Language for
                      Data-Driven Materials Science (759419)},
      pid          = {G:(EU-Grant)759419},
      typ          = {PUB:(DE-HGF)11},
      doi          = {10.18154/RWTH-2025-07969},
      url          = {https://publications.rwth-aachen.de/record/1018782},
}