% Conference paper (HiC 2025). OCR is braced in the title so that
% sentence-casing bibliography styles keep the acronym in capitals.
@inproceedings{broden-etal-2025-distant-356669,
  author    = {Brodén, Daniel and Samuelsson, Lina and Alfter, David and Malmstedt, Johan},
  title     = {A Distant Technology? Experiments with a Generative Model for Retouching Noisy Newspaper {OCR}},
  booktitle = {HiC 2025: Huminfra Conference 12–13 November, 2025 Stockholm, Sweden},
  year      = {2025},
  pages     = {1--7},
  abstract  = {This paper explores the use of generative language models to enhance digitized historical newspaper
text. While large language models offer new means of addressing noisy OCR, their opaque,
probabilistic processes raise epistemological concerns. Within the project The Order of Criticism
Revisited, which integrates literary and computational approaches to Swedish criticism, we tested
GPT-4o to “retouch” OCR data from the National Library of Sweden using zero-shot prompting.
Comparisons with flawed OCR outputs and manually transcribed texts show that the model
produced more legible versions, often closer to the originals than the raw OCR. This indicates
potential for improving the quality of digitized sources and enabling more robust large-scale
analysis. At the same time, drawing on the notions of artificial communication and distant
technology, we argue that such models extend analytical capacity while creating perceptual and
methodological distance. Their outputs, better seen as probabilistic “retouching” than correction or
reconstruction, weaken the indexical link to original sources.},
}
% Conference paper (DHNB 2024). Swedish is braced in the title so that
% sentence-casing styles keep the capital; the date range in booktitle
% uses a double hyphen so it is typeset as an en dash.
@inproceedings{broden-etal-2025-between-349707,
  author    = {Brodén, Daniel and Samuelsson, Lina and Zechner, Niklas and Ingvarsson, Jonas and Karimi, Aram},
  title     = {Between the Arduous and the Automatic: A Comparative Approach to the Challenge of Classifying of Book Reviews in {Swedish} Newspapers},
  booktitle = {Digital Humanities in the Nordic and Baltic Countries 2024, May 27--31, 2024, Reykjavik, Iceland},
  year      = {2025},
  publisher = {University of Oslo Library},
  address   = {Oslo},
  abstract  = {This paper examines the methodological challenges of identifying literary book reviews in newspapers, contrasting manual and automated approaches. By discussing the manual, and 'traditional,' approach of a previous literature study alongside computational methods for classifying book reviews, we explore how human and automated approaches provide complementary perspectives on this task with a focus on the National Library of Sweden's historical newspaper collection. Along with different findings, the paper highlights key issues related to the arbitrariness of ‘what constitutes a book review,’ digitisation and annotation issues and differences between frequency-based and BERT methods. We conclude by suggesting that nuanced text mining of specific types of newspaper articles benefits from considering both contextual and computational perspectives, which can together enhance our understanding of the complexities involved.},
}
% Workshop paper (DiPaDA 2024). The booktitle carries no trailing period
% because the bibliography style supplies its own punctuation, and it
% spells the workshop name in full.
@inproceedings{broden-etal-2025-politics-349710,
  author    = {Brodén, Daniel and Ohlsson, Claes and Ängsal, Magnus Pettersson and Björck, Henrik and Fridlund, Mats and Olsson, Leif-Jöran and Runefelt, Leif and Virk, Shafqat Mumtaz},
  title     = {The Politics of Compound Neologisms: A Novel Text-Mining Approach for Tracing Conceptual Transformations in Parliamentary Discourse and Data},
  booktitle = {Digital Parliamentary Data in Action (DiPaDA 2024) Workshop, Reykjavik, Iceland, May 28, 2024},
  year      = {2025},
  pages     = {35--49},
  publisher = {University of Oslo Library},
  address   = {Oslo},
  abstract  = {This paper highlights the underutilized analytical potential of compounds and neologisms as indicators of discursive change in text mining applications, particularly in the study of parliamentary discourse and conceptual transformation. Drawing on results from two research projects, this project-wide paper discusses how compound neologisms function as markers of discursive change through case studies focused on the formation, frequency, and productivity of compounds related to the key concepts of 'market' and 'terrorism' in the Swedish Parliament. The analysis combines distant reading techniques to identify large-scale trends and close reading to examine the specific contexts of these compounds. By focusing on compound formation, we emphasize the analytical potential of basic linguistic features often overlooked in Digital Humanities research, offering a fresh perspective on large parliamentary datasets and their role in tracing conceptual transformations over time.},
}
% Workshop paper (DiPaDA 2024). The page range uses the ASCII double
% hyphen so that styles recognise it as a range; SweTerror is braced in
% the title to keep its internal capital under sentence-casing styles.
@inproceedings{olsson-etal-2025-augmented-349766,
  author    = {Olsson, Leif-Jöran and Brodén, Daniel and Ängsal, Magnus Pettersson and Fridlund, Mats and Öhberg, Patrik},
  title     = {Augmented Analysis of Parliamentary Debates: The Word Embedding and Context-sensitive Approach of the {SweTerror} Project},
  booktitle = {Digital Parliamentary Data in Action (DiPaDA 2024) Workshop},
  year      = {2025},
  pages     = {90--105},
  abstract  = {This paper delves into the SweTerror project’s use of word vectors to enhance the analysis of parliamentary debates concerning terrorism in Sweden during the electoral periods from 1968 to 2018. We focus on how word embeddings capture semantic shifts and the evolving context of key concepts like terror, terrorism, and extremism over time. By combining these computational tools with enriched metadata and document annotation as well as a mixed-methods and context-sensitive approach, we trace temporal changes in parliamentary discourse. The study demonstrates how generating vectors for distinct periods, such as electoral periods or parliamentary years, provides nuanced insights into conceptual transformations, including the introduction of the modern use of the concept of terrorism in the 1970s and the impact of the term violence-affirming extremism in the context of Islamism in the 2010s. We conclude by stressing that this approach allows for a more sophisticated analysis of linguistic and discursive patterns within Swedish parliamentary discourse.},
}
% Conference paper (HiC 2025). DigiCURE is braced in the title so that
% sentence-casing styles do not flatten it to "Digicure".
@inproceedings{westin-etal-2025-digicure-357671,
  author    = {Westin, Jonathan and Lindhé, Cecilia and Brodén, Daniel and Tomasini, Matteo and Almevik, Gunnar},
  title     = {{DigiCURE}: Building a Digital Humanities Infrastructure for Preserving and Studying At-risk Cultural Heritage},
  booktitle = {Proceedings of the 2nd Huminfra Conference. HiC 2025},
  year      = {2025},
}
% Chapter in an edited volume. The volume editors are stored in the
% editor field (one name per "and"-separated item) rather than appended
% to booktitle, which also removes a bare ampersand that LaTeX would
% treat as an alignment character.
@incollection{broden-etal-2025-interdisciplinary-356666,
  author    = {Brodén, Daniel and Fridlund, Mats and Lindhé, Cecilia and Westin, Jonathan},
  title     = {Interdisciplinary digital project design},
  booktitle = {Huminfra handbook: Empowering digital and experimental humanities},
  editor    = {Bouma, Gerlof and Dannélls, Dana and Kokkinakis, Dimitrios and Volodina, Elena},
  year      = {2025},
  pages     = {57--76},
  publisher = {University of Tartu Library},
  address   = {Tartu},
  isbn      = {978-99-0853-612-5},
  abstract  = {While discussions in digital humanities increasingly emphasise the importance of reflecting on collaborative workflows for interdisciplinary research, attention to specific practical expertise remains lacking. This paper introduces the concept of interdisciplinary digital project design to highlight a professional practice that integrates collaboration between traditional Humanities and Social Science (HSS) researchers and technical experts in developing research projects, digital resources and more. We begin by addressing the need for protocols to support workflow-oriented approaches to interdisciplinary collaboration, while underscoring the role of embodied expertise in facilitating teamwork. Furthermore, we argue that judgement – a critical yet often overlooked element – is an integral aspect of the professionalism involved. The discussion is grounded in descriptions of our contribution to five digital HSS projects, each offering a different perspective on the integrative professionalism involved. The paper concludes by discussing ways to further advance the conceptual understanding of interdisciplinary digital project design, with particular attention to the expertise that underpins this practice.},
}
% Journal article in Barnboken, volume 48 (2025); Swedish title with an
% English abstract.
@article{samuelsson-etal-2025-barnlitteraturkritikens-356665,
  author   = {Samuelsson, Lina and Brodén, Daniel and Ingvarsson, Jonas and Karimi, Aram},
  title    = {Barnlitteraturkritikens ordning: Recensioner av barnlitteratur i svenska dagstidningar och bloggar 2006 och 2016},
  journal  = {Barnboken},
  volume   = {48},
  year     = {2025},
  abstract = {Based on computational analyses of book reviews of children’s literature in relation to other literary criticism from the years 2006 and 2016 in daily press and book blogs, this study examines the discursive order of children’s book reviews. The study is inspired by the analytical model employed by Lina Samuelsson in Kritikens ordning (2013). Specifically we focus on the characteristics of children’s book criticism and questions whether it differs from other literary reviews, and if so, how. The article identifies several essential features present in children’s book reviews, and discusses possible differences between reviews in the daily press and those on book blogs. We conclude that our mixed-methods approach-“computational” combined with “traditional”-allows us to highlight both similarities and differences between children’s literature criticism and literary criticism in general, and that there is value in examining children’s book reviewing from both digital and traditional perspectives.},
}
% Journal article with a Chinese title and an English abstract,
% volume 5, number 1, pages 3--10.
% NOTE(review): the given name "Ashely" in the author list may be a
% transposition of "Ashley" -- confirm against the published article.
@article{fridlund-etal-2025--349767,
  author   = {Fridlund, Mats and Alfter, David and Brodén, Daniel and Green, Ashely and Karimi, Aram and Lindhé, Cecilia},
  title    = {人文主义人工智能:一个跨学科的专业知识与研究新领域},
  journal  = {数字人文研究 / Digital Humanities Research},
  volume   = {5},
  number   = {1},
  pages    = {3--10},
  year     = {2025},
  abstract = {The Gothenburg Research Infrastructure in Digital Humanities (GRIDH) have participated in projects within various humanities fields that utilise as well as develop research tools and infrastructural resources that incorporate applications of ‘artificial intelligence’ (AI). These applications can include natural language processing, machine learning, computer vision, large language models, image recognition algorithms, classification, clustering, and deep learning. This paper advances the term ‘humanistic AI’ to describe an emergent form of interdisciplinary practice that uses and develops AI-based research applications to answer humanities research questions together with its entangled humanistic reflection. We coin this term to make implicit and visible the epistemological and material particularities of its practice and the new forms of knowledge its affordances make possible. The paper presents GRIDH projects within ‘humanistic AI’ together with its developed AI resources and applications.},
}
% Record for the DiPaDA 2024 workshop as a whole. DiPaDA is braced in
% the title so that sentence-casing styles keep its capitalisation.
% NOTE(review): this looks like an edited proceedings volume; if so,
% a proceedings entry with an editor field may fit better -- confirm.
@misc{broden-etal-2025-digital-349765,
  author    = {Brodén, Daniel and Fridlund, Mats and La Mela, Matti and Wendsjö, Albert},
  title     = {Digital Parliamentary Data in Action ({DiPaDA} 2024) Workshop},
  year      = {2025},
  publisher = {University of Oslo},
  address   = {Oslo},
}
% Introduction to the DiPaDA 2024 workshop. DiPaDA is braced in the
% title so that sentence-casing styles keep its capitalisation.
% NOTE(review): volume, number and pages are present without a journal
% or series name -- confirm the container and add it if known.
@misc{broden-etal-2025-digital-349764,
  author   = {Brodén, Daniel and Fridlund, Mats and La Mela, Matti and Wendsjö, Albert},
  title    = {Digital Parliamentary Data in Action ({DiPaDA} 2024): Introduction},
  year     = {2025},
  volume   = {7},
  number   = {1},
  pages    = {1--6},
  abstract = {The workshop Digital Parliamentary Data in Action 2024 (DiPaDA 2024) took place in Reykjavik, Iceland, on 28 May, co-located with The 8th Digital Humanities in the Nordic and Baltic Countries Conference (DHNB 2024). The workshop, along with its predecessor organised in Uppsala in 2022, supports the advancement of research using parliamentary datasets, which present both opportunities and challenges for interdisciplinary research and infrastructure development especially in the digital humanities and social sciences.},
}