% Introduction to the TAMAR web application (record language: German).
% The ampersand is escaped and the dash is written as "--" so the title
% compiles under LaTeX and uses LaTeX escapes like the umlauts do; the braces
% keep the capitals that spell out the acronym when a style recases titles.
@misc{b6d4a0ee0068483098561757643ee110,
  author   = {Ratzke, Malena and Wimmer, Hanna and M{\"o}ller, Ralf and Thiemann, Stefan},
  title    = {{TAMAR} -- {Transcriptions} \& {Annotations} for {MAnuscript} {Research}: Einf{\"u}hrung},
  year     = {2025},
  month    = jun,
  day      = {3},
  doi      = {10.25592/uhhfdm.17566},
  language = {Deutsch},
  keywords = {Biblia-pauperum, Transkription, Annotation, Manuskript},
  abstract = {TAMAR steht f{\"u}r Transcription and Annotation for MAnuscript Research. TAMAR erm{\"o}glicht es, Handschriftendigitalisate mit Transkriptionen von Textelementen oder weiteren Informationen darzustellen. Arbeitstranskriptionen zu ausgew{\"a}hlten Passagen von Biblia-pauperum-Handschriften bilden das Datenkorpus bei der Ver{\"o}ffentlichung im Jahr 2025. TAMAR ist ein Kooperationsprojekt des Projekts FNT08, Reframing Old Contents for New Readers in Late-Medieval German OneVolume Libraries (Wimmer/Ratzke 2023) und dem Research Field F, Data Linking im Exzellenzcluster Understanding Written Artefacts am Centre for the Study of Manuscript Cultures Hamburg (CSMC). Bereitgestellt werden neben der Einf{\"u}hrung, den Transkriptionsrichtlinien und den Transkriptionsdaten (10.25592/uhhfdm.17566) drei Ansichten in der Webanwendung TAMAR (10.25592/tamar): Zwei Interfaces mit Auswahlm{\"o}glichkeiten f{\"u}r die zu visualisierenden Daten sowie ein Viewer, der die Auswahl als interaktive, annotierte digitale Faksimiles mit Transkriptionen der Textelemente anzeigt.},
}
% Journal article in Humanities and Social Sciences Communications, vol. 12, no. 1 (2025).
% Names are given in "Last, First" form; field values are brace-delimited.
@article{02c53b332ccf448c84741b4e41f7bf00,
  author    = {Asselborn, Thomas and Melzer, Sylvia and Schiff, Simon and Bender, Magnus and Marwitz, Florian and Aljoumani, Said and Thiemann, Stefan and Hirschler, Konrad and M{\"o}ller, Ralf},
  title     = {Building sustainable information systems and transformer models on demand},
  journal   = {Humanities and Social Sciences Communications},
  volume    = {12},
  number    = {1},
  year      = {2025},
  month     = feb,
  day       = {15},
  publisher = {Springer Nature},
  issn      = {2662-9992},
  doi       = {10.1057/s41599-025-04491-x},
  language  = {English},
  abstract  = {The growing practice of archiving research data in repositories reflects an upward trend. However, storing data in an RDR (Research Data Repository) does not guarantee that the archived data will always be readily reusable, even if this fulfils the FAIR (Findable, Accessible, Interoperable, Reusable) principles. To ensure sustainable RDM (Research Data Management), archiving must consider the future potential for data reuse in a low-threshold fashion. In this article, we demonstrate the utilisation of straightforward methods to implement a so-called warm or hot archiving for research data within an RDR, as opposed to the conventional cold archiving approach. We explore the additional value of using research data in the humanities, emphasising the advantages of maintaining data accessibility and relevance over time. In the humanities, evaluating numerous data sets efficiently is crucial for current and future projects. Reviewing and evaluating relevance is important, particularly when dealing with a substantial number of data sets. Rapid evaluation facilitates profound decisions on the utility of the data for one{\textquoteright}s ongoing or upcoming projects. For hot archiving, this means that in addition to the research data, the data should be available in a human-friendly way, i.e., a viewer application to visualise the data should be easily accessible. However, as rapid developments in the IT sector mean that after a few years, it cannot be guaranteed that these viewers or other tools will work, we also show how data can be viewed in a user-specific way via the RDR and how sustainable viewing can be integrated into the RDR. This article presents a generic approach to building sustainable viewers, which we call information systems, or transformer models on demand using data from pre-modern Arabic. 
In addition, we show that the easy-to-use chatbot ChatGPT can alternatively be context-specifically prepared to deliver more precise results and associated resources in the field of humanities. On the one hand, we have achieved a substantial reduction in the development time of an information system, from months to seconds, as well as the ability to fine-tune BERT (Bidirectional Encoder Representations from Transformers) models without specific knowledge in selecting models or tools. On the other hand, we have developed a chatbot that not only provides project-specific responses but also references the sources.},
}
% Editors' introduction printed in the CHAI 2024 workshop proceedings (pp. 1--4).
% Typed as incollection: a titled contribution with its own authors inside an
% edited volume. Classic styles ignore booktitle for inbook and reject an
% entry carrying both author and editor.
% The language is English, as the title and abstract show and as the
% proceedings record with the same volume number states.
@incollection{91751cc3d5eb462183d04265387802ba,
  author    = {Melzer, Sylvia and Peukert, Hagen and Thiemann, Stefan and Radisch, Erik},
  title     = {Introduction to the Fourth Workshop on Humanities-Centred Artificial Intelligence},
  booktitle = {Proceedings of the Workshop on Humanities-Centred Artificial Intelligence ({CHAI} 2024)},
  editor    = {Melzer, Sylvia and Peukert, Hagen and Thiemann, Stefan and Radisch, Erik},
  volume    = {3814},
  pages     = {1--4},
  publisher = {CEUR-WS.org},
  year      = {2024},
  month     = oct,
  day       = {30},
  language  = {English},
  note      = {4th Workshop on Humanities-Centred Artificial Intelligence: 47th German Conference on Artificial Intelligence, CHAI 2024 ; Conference date: 23-09-2024 Through 24-09-2024},
  url       = {https://www.csmc.uni-hamburg.de/ki2024-chai},
  abstract  = {Artificial Intelligence (AI) can support research in the Humanities making it easier and more efficient. It is thus essential that AI practitioners and Humanities scholars take a Humanities-centred approach to the development, deployment and application of AI methods for the Humanities. Inferring ancient cultural traditions from written artefacts, AI offers many opportunities to assist humanities scholars in their work. Editorial projects and computer-aided evaluations, such as text and data mining or linguistic analyses, require the collecting, storing, and linking of data in order to quickly identify core information of the written artefacts under investigation. Time-consuming procedures like the creation of dictionaries or the use of bibliographies can be facilitated, abridged and designed more efficiently through the automatic linking of data, which enables to create extensive data sets and to generate additional information. In this way, AI supports scholars with time-saving methods for their research, hence leaving more room for core tasks and questions. To ensure that the use of AI methods in the humanities remains not only abstract and theoretic, the applicability of algorithms in respective research needs to be specifically examined and intentionally developed with a clear focus on humanities research.},
}
% Proceedings volume of the 4th CHAI workshop (volume 3814, CEUR-WS.org).
% The four people are recorded as editors, as in the chapter record that cites
% this volume. The word "Intelligence" is restored in the title from the
% workshop name given in the note field.
% NOTE(review): confirm the exact title wording against the published volume.
@book{745f913877b5431a871ad6990b3b2ba5,
  editor    = {Melzer, Sylvia and Peukert, Hagen and Thiemann, Stefan and Radisch, Erik},
  title     = {Proceedings of the 4th Workshop on Humanities-Centred Artificial Intelligence ({CHAI} 2024)},
  volume    = {3814},
  publisher = {CEUR-WS.org},
  year      = {2024},
  month     = oct,
  day       = {30},
  language  = {English},
  note      = {4th Workshop on Humanities-Centred Artificial Intelligence: 47th German Conference on Artificial Intelligence ; Conference date: 23-09-2024 Through 24-09-2024},
  url       = {https://www.csmc.uni-hamburg.de/ki2024-chai},
}
% Journal article in Data Science Journal, vol. 22, no. 39 (2023).
% Names are given in "Last, First" form; field values are brace-delimited.
@article{ae6cf57d46eb4d56bc762c3f86a960b4,
  author    = {Melzer, Sylvia and Thiemann, Stefan and Schiff, Simon and M{\"o}ller, Ralf},
  title     = {Implementation of a Federated Information System by means of Reuse of Research Data archived in Research Data Repositories},
  journal   = {Data Science Journal},
  volume    = {22},
  number    = {39},
  year      = {2023},
  month     = oct,
  day       = {12},
  publisher = {Ubiquity Press},
  issn      = {1683-1470},
  doi       = {10.5334/dsj-2023-039},
  language  = {English},
  keywords  = {FAIR principles, data management plan, databasing on demand, federated information system},
  abstract  = {At universities, research data is increasingly stored in research data repositories according to a data management plan (DMP) and thus made available for further use. The challenge of reusing hundreds, thousands, or millions of data sets is to obtain an overview of the data in a short period of time and to search through all the data. The high variability of the formats used to store research data requires a new approach to data reusability that focuses on the visualisation and searchability of archived research data, which can also be combined with each other. In this article, we present a practical DMP that describes how information systems can be created on demand by reusing research data archived in research data repositories and how these systems can be merged into a federated information system. As a result, in our projects, information systems have been created in minutes or a couple of hours with few resources. The initial effort to create a federated system remains; however, this allows federated searches to be performed. Extending a federated system to include other information systems can then be accomplished by making a few configurations and manageable adjustments to the source code.},
}
% Conference contribution at "Digital Total" with no proceedings data.
% Typed as misc: the conference/inproceedings type requires a booktitle,
% which this record does not have.
% NOTE(review): month is sep, but the note gives the conference date as
% 09-10-2023 through 10-10-2023. Other notes in this file use DD-MM-YYYY,
% which would make this October -- confirm before changing.
@misc{ab76ed7049b54b03a2fe0bcb889f1df6,
  author   = {Melzer, Sylvia and Thiemann, Stefan and M{\"o}ller, Ralf},
  title    = {Digital Data Handling at {UWA}},
  year     = {2023},
  month    = sep,
  language = {Deutsch},
  note     = {Digital Total ; Conference date: 09-10-2023 Through 10-10-2023},
  url      = {https://www.conferences.uni-hamburg.de/event/387/},
}
% German-language journal article in Bausteine Forschungsdatenmanagement, vol. 2, no. 3 (2023).
% Nouns in the title are braced so that styles which sentence-case article
% titles do not lowercase them. The abstract is cleaned of line-break hyphens,
% fused words and a stray footnote marker left by text extraction.
@article{d0d7e0145c024e608d68c2b14a5d63a5,
  author   = {Peukert, Hagen and Melzer, Sylvia and Jacob, Juliane and Vogel, Iris and W{\"o}rner, Kai and Gr{\"u}nler, Steffen and Brase, Lisa and Heinrich, Alexander and Thiemann, Stefan},
  title    = {Das {Forschungsdatenzentrum} der {Universit{\"a}t} {Hamburg}: Auf dem {Weg} zu einem gemeinsamen {Verst{\"a}ndnis} im {Umgang} mit {Forschungsdaten} in den {Natur-}, {Sozial-} und {Geisteswissenschaften}},
  journal  = {Bausteine Forschungsdatenmanagement},
  volume   = {2},
  number   = {3},
  pages    = {2--13},
  year     = {2023},
  month    = may,
  day      = {31},
  doi      = {10.17192/BFDM.2023.3.8562},
  language = {Deutsch},
  abstract = {Die Umsetzung und Etablierung eines generischen Forschungsdatenmanagements an der Universit{\"a}t Hamburg folgt dem Ansatz des Kaizen-basierten Continuous Improvement Prozesses (CIP), bei dem induktiv und kleinschrittig aus disziplinenspezifischen Best-Practices gelernt wird. Der Forschungsdatenlebenzyklus, in dem sich die Prozesse jeder Disziplin wiederfinden lassen, dient als gemeinsamer Ausgangspunkt. Ebenso werden die strategischen Vorgaben der Universit{\"a}t zum Open Science ber{\"u}cksichtigt. Dieser Erfahrungsbericht stellt ein Ergebnis des CIPs dar, dessen Hauptaufgabe darin besteht, die Prozesse so zu gestalten und in verschiedenen Softwarel{\"o}sungen abzubilden, dass sich eine stetig wachsende Zahl an disziplinenspezifischen Praktiken umsetzen lassen.},
}
% Editors' introduction printed in the CHAI 2023 workshop proceedings (pp. 1--4).
% Typed as incollection: a titled contribution with its own authors inside an
% edited volume. Classic styles ignore booktitle for inbook and reject an
% entry carrying both author and editor.
% The booktitle carries the "(CHAI 2023)" suffix used by the proceedings
% record with the same volume number.
@incollection{e217c39735f2474da5d9d8c09a5e6e65,
  author    = {Melzer, Sylvia and Peukert, Hagen and Thiemann, Stefan},
  title     = {Introduction to the Third Workshop on Humanities-Centred Artificial Intelligence},
  booktitle = {Proceedings of the Workshop on Humanities-Centred Artificial Intelligence ({CHAI} 2023)},
  editor    = {Melzer, Sylvia and Peukert, Hagen and Thiemann, Stefan},
  series    = {CEUR Workshop Proceedings},
  volume    = {3580},
  pages     = {1--4},
  publisher = {CEUR-WS.org},
  year      = {2023},
  language  = {English},
}
% Proceedings volume of the CHAI 2023 workshop (volume 3580, CEUR-WS.org).
% The series name is the one given by the chapter record that shares this
% volume number and publisher.
@book{00491b43fe764f3bb23ad3a5b85873b1,
  editor    = {Melzer, Sylvia and Peukert, Hagen and Thiemann, Stefan},
  title     = {Proceedings of the Workshop on Humanities-Centred Artificial Intelligence ({CHAI} 2023)},
  series    = {CEUR Workshop Proceedings},
  volume    = {3580},
  publisher = {CEUR-WS.org},
  year      = {2023},
  language  = {English},
}
% Journal article in Advances in Science, Technology and Engineering Systems
% Journal, vol. 7, pp. 19--31 (2022).
% Typed as article: the original record stored the journal name in both
% series and booktitle, which marks it as a periodical, not a book chapter.
% NOTE(review): the former edition value 3 is stored as the issue number,
% which agrees with the DOI suffix aj070303 -- confirm against the journal.
% The editor field is kept from the original record.
@article{bb5a77d738ee4aab8a0f2cc56913eab7,
  author   = {Melzer, Sylvia and Thiemann, Stefan and Peukert, Hagen and M{\"o}ller, Ralf},
  title    = {Towards a Model-based and Variant-oriented Development of a System of Systems},
  journal  = {Advances in Science, Technology and Engineering Systems Journal},
  volume   = {7},
  number   = {3},
  pages    = {19--31},
  year     = {2022},
  month    = may,
  day      = {25},
  doi      = {10.25046/aj070303},
  language = {English},
  editor   = {Kazmersk, Passerini},
}