<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.0 20120330//EN" "JATS-archivearticle1.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta />
    <article-meta>
      <title-group>
        <article-title>Introduction to the Fourth Workshop on Humanities-Centred Artificial Intelligence</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <string-name>Sylvia Melzer</string-name>
          <email>sylvia.melzer@uni-hamburg.de</email>
          <xref ref-type="aff" rid="aff10">10</xref>
          <xref ref-type="aff" rid="aff11">11</xref>
          <xref ref-type="aff" rid="aff12">12</xref>
          <xref ref-type="aff" rid="aff13">13</xref>
          <xref ref-type="aff" rid="aff2">2</xref>
          <xref ref-type="aff" rid="aff3">3</xref>
          <xref ref-type="aff" rid="aff4">4</xref>
          <xref ref-type="aff" rid="aff5">5</xref>
          <xref ref-type="aff" rid="aff6">6</xref>
          <xref ref-type="aff" rid="aff7">7</xref>
          <xref ref-type="aff" rid="aff8">8</xref>
          <xref ref-type="aff" rid="aff9">9</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Hagen Peukert</string-name>
          <email>hagen.peukert@uni-hamburg.de</email>
          <xref ref-type="aff" rid="aff1">1</xref>
          <xref ref-type="aff" rid="aff10">10</xref>
          <xref ref-type="aff" rid="aff11">11</xref>
          <xref ref-type="aff" rid="aff12">12</xref>
          <xref ref-type="aff" rid="aff13">13</xref>
          <xref ref-type="aff" rid="aff5">5</xref>
          <xref ref-type="aff" rid="aff6">6</xref>
          <xref ref-type="aff" rid="aff7">7</xref>
          <xref ref-type="aff" rid="aff8">8</xref>
          <xref ref-type="aff" rid="aff9">9</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Stefan Thiemann</string-name>
          <email>stefan.thiemannt@uni-hamburg.de</email>
          <xref ref-type="aff" rid="aff1">1</xref>
          <xref ref-type="aff" rid="aff10">10</xref>
          <xref ref-type="aff" rid="aff11">11</xref>
          <xref ref-type="aff" rid="aff12">12</xref>
          <xref ref-type="aff" rid="aff13">13</xref>
          <xref ref-type="aff" rid="aff5">5</xref>
          <xref ref-type="aff" rid="aff6">6</xref>
          <xref ref-type="aff" rid="aff7">7</xref>
          <xref ref-type="aff" rid="aff8">8</xref>
          <xref ref-type="aff" rid="aff9">9</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Erik Radisch</string-name>
          <email>radisch@saw-leipzig.de</email>
          <xref ref-type="aff" rid="aff0">0</xref>
          <xref ref-type="aff" rid="aff10">10</xref>
          <xref ref-type="aff" rid="aff11">11</xref>
          <xref ref-type="aff" rid="aff12">12</xref>
          <xref ref-type="aff" rid="aff13">13</xref>
          <xref ref-type="aff" rid="aff5">5</xref>
          <xref ref-type="aff" rid="aff6">6</xref>
          <xref ref-type="aff" rid="aff7">7</xref>
          <xref ref-type="aff" rid="aff8">8</xref>
          <xref ref-type="aff" rid="aff9">9</xref>
        </contrib>
        <aff id="aff0">
          <label>0</label>
          <institution>Sächsische Akademie der Wissenschaften zu Leipzig</institution>
          ,
          <addr-line>Karl-Tauchnitz-Str. 1, 04107 Leipzig</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff1">
          <label>1</label>
          <institution>University of Hamburg, Center for Sustainable Research Data Management</institution>
          ,
          <addr-line>Monetastraße 4, 20146 Hamburg</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff2">
          <label>2</label>
          <institution>University of Hamburg, Centre for the Study of Manuscript Cultures (CSMC)</institution>
          ,
          <addr-line>Warburgstraße 26, 20354 Hamburg</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff3">
          <label>3</label>
          <institution>University of Hamburg, Cluster of Excellence 'Understanding Written Artefacts' (UWA)</institution>
          ,
          <addr-line>Warburgstraße 26, 20354 Hamburg</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff4">
          <label>4</label>
          <institution>University of Hamburg, Institute for Humanities-Centered AI (CHAI)</institution>
          ,
          <addr-line>Warburgstraße 28, 20354 Hamburg</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff5">
          <label>5</label>
          <institution>Dr Erik Radisch, Sächsische Akademie der Wissenschaften zu Leipzig</institution>
        </aff>
        <aff id="aff6">
          <label>6</label>
          <institution>Dr Erik Radisch, Sächsische Akademie der Wissenschaften zu Leipzig</institution>
        </aff>
        <aff id="aff7">
          <label>7</label>
          <institution>Dr Hagen Peukert, Universität Hamburg</institution>
        </aff>
        <aff id="aff8">
          <label>8</label>
          <institution>Dr Hagen Peukert, Universität Hamburg</institution>
        </aff>
        <aff id="aff9">
          <label>9</label>
          <institution>Dr Stefan Thiemann, Universität Hamburg</institution>
        </aff>
        <aff id="aff10">
          <label>10</label>
          <institution>Dr Stefan Thiemann, Universität Hamburg</institution>
        </aff>
        <aff id="aff11">
          <label>11</label>
          <institution>Dr Sylvia Melzer, Universität Hamburg &amp; Universität zu Lübeck</institution>
        </aff>
        <aff id="aff12">
          <label>12</label>
          <institution>Prof Dr habil Meike Klettke, Universität Regensburg</institution>
        </aff>
        <aff id="aff13">
          <label>13</label>
          <institution>Thomas Asselborn, Universität Hamburg</institution>
        </aff>
      </contrib-group>
      <abstract>
        <p>Artificial Intelligence (AI), as the science of agents acting in the world, ofers significant support to research in the Humanities by enhancing eficiency and efectiveness. By adopting a Humanities-centered approach, scholars can tailor AI methods to specific needs. AI methods, developed within the science of human-machine interaction, can assist in interpreting ancient cultural traditions from written artefacts, optimizing processes such as text mining and linguistic analysis. The practical implementation of methods, derived from the science of AI, requires focused development to address specific Humanities challenges and optimize human-machine interaction in this field.</p>
      </abstract>
    </article-meta>
  </front>
  <body>
    <sec id="sec-1">
      <title>-</title>
      <p>1. Organising Committee
2. Program Committee</p>
    </sec>
    <sec id="sec-2">
      <title>3. Preface</title>
      <p>
        Our view of artificial intelligence (AI) is the science of agents acting in the world. [
        <xref ref-type="bibr" rid="ref1">1</xref>
        ]. Agents receive
precepts from the environment and take action. [
        <xref ref-type="bibr" rid="ref2">2</xref>
        ] An intelligent agent does an action with the aim to
achieve a local optimum. Achieving a local optimum implies the focus on maximizing performance
within a specific environment or task while recognizing that global optimization may be impractical or
unnecessary in some cases. In many real-world scenarios, the goal is not absolutely perfect but ”good
enough“ solutions that meet the needs of the current context.
      </p>
      <p>
        AI is currently on a grand triumphant advance in all parts of society. This advance does not stop at the
humanities. Humanities-Centred Artificial Intelligence (CHAI) was suggested as an emerging paradigm
in the article [
        <xref ref-type="bibr" rid="ref3">3</xref>
        ], and in the fourth CHAI workshop, we will highlight human-machine interactions
through a series of current research projects that emphasise the role of data usability, computational
methods and the use of large language models (LLMs) [4, 5] in various research areas, especially in the
humanities and law.
      </p>
      <p>The article [6] deals with the application of (intelligent) agents in the digital humanities, especially
in the field of text analysis. It emphasises that such agents ofer new possibilities for analysing and
interpreting texts that complement and support the work of humanities scholars rather than replacing it.
The focus of the CHAI contributions is also on complementing and supporting the work of humanities
scholars. The use of intelligent agents in the humanities requires close collaboration between humanities
scholars and AI experts, which can lead to new insights and methods in both fields, as the following
articles also demonstrate.</p>
      <p>The first paper Automate Text Processing for Schematically Analyzing Legal Texts presents an innovative
approach to the use of LLMs for processing legal texts and addresses their limitations. Given the
complexity and constant evolution of legal documents, the authors propose a method for automatically
extracting schematic representations that enables intelligent agents to make informed decisions based on
structured information. The method includes a legal case study and outlines a process for modelling and
extracting these schemas using LLMs. The paper also evaluates the capabilities of ChatGPT and Gemini
in this context. While the authors focus primarily on legal texts, they suggest that their approach could
be adapted for diferent types of natural language texts to improve decision making in diferent domains.</p>
      <p>The second article From Data Acquisition to Latent Semantic Analysis: Developing VERITRACE’s
Computational Approach to Tracing the Influence of Ancient Wisdom in Early Modern Natural Philosophy
focuses on the application of latent semantic analysis (LSA) [7] to uncover historical connections and
influences. This computational approach not only contributes to a better understanding of ancient
philosophies, but also illustrates the broader implications of LSA when analysing large text corpora.</p>
      <p>The third article Retrieving Information Presented on Webpages Using Large Language Models: A Case
Study demonstrates the potential of LLMs in improving information retrieval from digital sources. This
is in line with ongoing research on the potential of LLMs to improve the accessibility and usability of
data in various domains.</p>
      <p>The forth article Testing the Syntactic Competence of Large Language Models with a Translation Task
includes a discussion of the use of translation tasks as a method for testing the syntactic competence
of LLMs, particularly in the treatment of dative ambiguity in Russian. This research emphasises the
importance of language processing in the evaluation of agents’ LLMs and their ability to process complex
linguistic structures.</p>
      <p>In the fifth article Tracing the Palola Shahi Royal Genealogy by Fusing LLMs and Databases?: A Case
Study, research into tracing royal genealogies, such as the Pal.ola S.a¯hi lineage (for more details see
[8, 9]), through the fusion of LLMs and databases illustrates the innovative applications of agents in
historical research. This case study highlights the potential of interdisciplinary collaboration that
combines computational techniques with historical research.</p>
      <p>The first invited article Humanities in the Center of Data Usability: Data Visualization in Institutional
Research Repositories sets the stage by emphasizing the critical need for efective data visualization
techniques that enhance the reusability and interoperability of research datasets. In addition, an
innovative citation approach is presented that makes it possible to refer not only to the entire repository,
but also to a specific data set. The second invited article on Human-Centred Open-Source Automatic Text
Recognition for the Humanities with OCR4all emphasizes the need for user-friendly tools that empower
researchers in the humanities to a mass data analysis using software tools efectively. Both contributions
are in line with the general trend towards the development of open source and generic solutions that
improve the findability, accessibility, interoperability and reusability of data.</p>
      <p>In summary, these articles give an overview about the significant advances in data utilisation according
to FAIR principles, computational methods and the use of LLMs, and demonstrate their impact on
diferent areas of research. The integration of LLMs into legal and humanities research not only
streamlines processes but also opens up new ways of study and understanding.</p>
    </sec>
    <sec id="sec-3">
      <title>4. Presentations</title>
      <p>Abstracts and presentations are available at: https://doi.org/10.25592/uhhfdm.15984
Keynote: Humanities in the Center of Data Usability: Data Visualization in Institutional
Research Repositories
Hagen Peukert, Lucas Voges, Sylvia Melzer
From Data Acquisition to Latent Semantic Analysis: Developing VERITRACE’s
Computational Approach to Tracing the Influence of Ancient Wisdom in Early Modern Natural
Philosophy
Jefrey Wolf Vrije
Automate Text Processing for Schematically Analyzing Legal Texts
Magnus Bender
Retrieving Information Presented on Webpages Using Large Language Models: A Case Study
Thomas Asselborn, Karsten Helmholz, Ralf Möller
Testing the Syntactic Competence of Large Language Models with a Translation Task
Edyta Jurkiewicz-Rohrbacher
Tracing the Palola Shahi Royal Genealogy by Fusing LLMs and Databases?: A Case Study
Hui Xu, Thomas Asselborn, Haiyan Hu-von Hinüber, Oskar von Hinüber, Sylvia Melzer
Invited presentation: Human-Centred Open-Source Automatic Text Recognition for the
Humanities with OCR4all
Christian Reul, Maximilian Nöth, Herbert Baier, Florian Langhanki, Kevin Chadbourne</p>
    </sec>
    <sec id="sec-4">
      <title>Funding Information</title>
      <p>This contribution was partially funded by the Deutsche Forschungsgemeinschaft (DFG, German Research
Foundation) under Germany´s Excellence Strategy – EXC 2176 ‘Understanding Written Artefacts:
Material, Interaction and Transmission in Manuscript Cultures’, project no. 390893796. The research
was mainly conducted within the scope of the Centre for the Study of Manuscript Cultures (CSMC) at
Universität Hamburg.
[4] A. Vaswani, N. Shazeer, N. Parmar, J. Uszkoreit, L. Jones, A. N. Gomez, . Kaiser, I. Polosukhin,
Attention is all you need, in: Advances in Neural Information Processing Systems, 2017, pp.
5998–6008.
[5] OpenAI, Better language models and their implications, 2019. URL: https://openai.com/blog/
better-language-models/, archived from the original on 2020-12-19.
[6] J. Chun, K. Elkins, The crisis of artificial intelligence: A new digital humanities curriculum for
human-centred ai, International Journal of Humanities and Arts Computing 17 (2023) 147–167.
doi:10.3366/ijhac.2023.0310.
[7] S. Deerwester, S. T. Dumais, G. W. Furnas, T. K. Landauer, R. Harshman, Indexing by latent semantic
analysis, Journal of the American society for information science 41 (1990) 391–407.
[8] W. Luo, O. von Hinüber, News from palola: The jokhang and the yong-he inscriptions of
surendra¯ditya, in: N. Kudo (Ed.), Śa¯ntamatih. - Manuscripts for Life, volume 15 of Bibliotheca
Philologica et Philosophica Buddhica, International Research Institute for Advanced Buddhology,
Soka University, Tokyo, 2023, pp. 207–223.
[9] O. von Hinüber, Die Palola s.a¯his: Ihre Steininschriften, Inschriften auf Bronzen,
Handschriftenkolophone und Schutzzauber: Materialien zur Geschichte von Gilgit und Chilas, Antiquities of
Northern Pakistan, Heidelberg Academy of Sciences and Humanities, Mainz, 2016. URL: https:
//d-nb.info/1123441529/34.</p>
    </sec>
  </body>
  <back>
    <ref-list>
      <ref id="ref1">
        <mixed-citation>
          [1]
          <string-name>
            <given-names>S.</given-names>
            <surname>Melzer</surname>
          </string-name>
          , R. Möller, GenAI in Education, Science, and
          <string-name>
            <surname>Society</surname>
          </string-name>
          (13 Vorlesungen, University of Hamburg),
          <source>Präsentationen/Dias</source>
          ,
          <year>2024</year>
          . URL: https://www.edit.fis.uni-hamburg.de/ws/files/56466394/ GenAI_2024.zip.
        </mixed-citation>
      </ref>
      <ref id="ref2">
        <mixed-citation>
          [2]
          <string-name>
            <given-names>S.</given-names>
            <surname>Russell</surname>
          </string-name>
          ,
          <string-name>
            <given-names>P.</given-names>
            <surname>Norvig</surname>
          </string-name>
          ,
          <source>Artificial Intelligence: A Modern Approach</source>
          , 3 ed.,
          <source>Prentice Hall</source>
          ,
          <year>2010</year>
          .
        </mixed-citation>
      </ref>
      <ref id="ref3">
        <mixed-citation>
          [3]
          <string-name>
            <given-names>R.</given-names>
            <surname>Möller</surname>
          </string-name>
          ,
          <string-name>
            <surname>Humanities-Centred Artificial</surname>
          </string-name>
          <article-title>Intelligence (CHAI) as an Emerging Paradigm</article-title>
          , De Gruyter, Berlin, Boston,
          <year>2021</year>
          , pp.
          <fpage>245</fpage>
          -
          <lpage>266</lpage>
          . URL: https://doi.org/10.1515/
          <fpage>9783110753301</fpage>
          -
          <lpage>013</lpage>
          . doi:doi:10. 1515/
          <fpage>9783110753301</fpage>
          -
          <lpage>013</lpage>
          .
        </mixed-citation>
      </ref>
    </ref-list>
  </back>
</article>