% Bibliography entries for 2023 publications (UTF-8 encoded; process with a
% Unicode-aware backend such as Biber).
% Conventions: lowercase entry types and field names, one field per line,
% personal names in "Last, First" form, and braces around acronyms and proper
% nouns in titles so that sentence-casing styles keep their capitalisation.

% Paper in the NLP4CALL 2023 proceedings. Publisher follows the entry for the
% proceedings volume itself (same ISBN); the name previously stored as
% publisher is kept as the series.
@inproceedings{volodina-etal-2023-dalaj-326817,
  author    = {Volodina, Elena and Ali Mohammed, Yousuf and Berdicevskis, Aleksandrs and Bouma, Gerlof and Öhman, Joey},
  title     = {{DaLAJ-GED} – a dataset for Grammatical Error Detection tasks on {Swedish}},
  booktitle = {Proceedings of the 12th Workshop on Natural Language Processing for Computer Assisted Language Learning (NLP4CALL 2023)},
  editor    = {Alfter, David and Volodina, Elena and François, Thomas and Jönsson, Arne and Rennes, Evelina},
  year      = {2023},
  series    = {Linköping Electronic Conference Proceedings},
  publisher = {Linköping University Press},
  address   = {Linköping},
  isbn      = {978-91-8075-250-3},
  pages     = {94--101},
}

% The volume editors were previously embedded in booktitle; they now live in
% the editor field. Conference dates and location stay in booktitle.
@inproceedings{berdicevskis-etal-2023-superlim-331445,
  author    = {Berdicevskis, Aleksandrs and Bouma, Gerlof and Kurtz, Robin and Morger, Felix
               and Öhman, Joey and Adesam, Yvonne and Borin, Lars and Dannélls, Dana
               and Forsberg, Markus and Isbister, Tim and Lindahl, Anna and Malmsten, Martin
               and Rekathati, Faton and Sahlgren, Magnus and Volodina, Elena and Börjeson, Love
               and Hengchen, Simon and Tahmasebi, Nina},
  title     = {{Superlim}: A {Swedish} Language Understanding Evaluation Benchmark},
  booktitle = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, December 6--10, 2023, Singapore},
  editor    = {Bouamor, Houda and Pino, Juan and Bali, Kalika},
  year      = {2023},
  publisher = {Association for Computational Linguistics},
  address   = {Stroudsburg, PA},
  isbn      = {979-8-89176-060-8},
  pages     = {8137--8153},
}

% The proceedings volume as a whole (an edited collection, hence the
% proceedings entry type with editors and no authors).
@proceedings{alfter-etal-2023-proceedings-331649,
  editor    = {Alfter, David and Volodina, Elena and François, Thomas and Jönsson, Arne and Rennes, Evelina},
  title     = {Proceedings of the 12th Workshop on Natural Language Processing for Computer Assisted Language Learning (NLP4CALL 2023)},
  year      = {2023},
  publisher = {Linköping University Press},
  address   = {Linköping},
  isbn      = {978-91-8075-250-3},
  abstract  = {The workshop series on Natural Language Processing (NLP) for Computer-Assisted Language Learning (NLP4CALL) is a meeting place for researchers working on the integration of Natural Language Processing and Speech Technologies in CALL systems and exploring the theoretical and methodological issues arising in this connection. The latter includes, among others, the integration of insights from Second Language Acquisition (SLA) research, and the promotion of “Computational SLA” through setting up Second Language research infrastructures.},
}

% Paper in the NLP4CALL 2023 proceedings. editor, address and isbn are copied
% from the other entries for the same volume; the page range is not recorded
% in this file.
@inproceedings{volodina-etal-2023-multiged-331652,
  author    = {Volodina, Elena and Bryant, Christopher and Caines, Andrew and De Clercq, Orphée and Frey, Jennifer-Carmen and Ershova, Elizaveta and Rosen, Alexandr and Vinogradova, Olga},
  title     = {{MultiGED-2023} shared task at {NLP4CALL}: Multilingual Grammatical Error Detection},
  booktitle = {Proceedings of the 12th Workshop on Natural Language Processing for Computer Assisted Language Learning (NLP4CALL 2023)},
  editor    = {Alfter, David and Volodina, Elena and François, Thomas and Jönsson, Arne and Rennes, Evelina},
  year      = {2023},
  publisher = {Linköping University Press},
  address   = {Linköping},
  isbn      = {978-91-8075-250-3},
  abstract  = {This paper reports on the NLP4CALL shared task on Multilingual Grammatical Error Detection (MultiGED-2023), which included five languages: Czech, English, German, Italian and Swedish. It is the first shared task organized by the Computational SLA working group, whose aim is to promote less represented languages in the fields of Grammatical Error Detection and Correction, and other related fields. The MultiGED datasets have been produced based on second language (L2) learner corpora for each particular language. In this paper we introduce the task as a whole, elaborate on the dataset generation process and the design choices made to obtain MultiGED datasets, provide details of the evaluation metrics and CodaLab setup. We further briefly describe the systems used by participants and report the results.},
}

@inproceedings{masciolini-etal-2023-towards-329384,
  author    = {Masciolini, Arianna and Volodina, Elena and Dannélls, Dana},
  title     = {Towards automatically extracting morphosyntactical error patterns from {L1-L2} parallel dependency treebanks},
  booktitle = {Proceedings of the 18th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2023), July 13, 2023, Toronto, Canada},
  year      = {2023},
  publisher = {Association for Computational Linguistics},
  address   = {Stroudsburg, PA},
  isbn      = {978-1-959429-80-7},
  abstract  = {L1-L2 parallel dependency treebanks are UD-annotated corpora of learner sentences paired with correction hypotheses. Automatic morphosyntactical annotation has the potential to remove the need for explicit manual error tagging and improve interoperability, but makes it more challenging to locate grammatical errors in the resulting datasets. We therefore propose a novel method for automatically extracting morphosyntactical error patterns and perform a preliminary bilingual evaluation of its first implementation through a similar example retrieval task. The resulting pipeline is also available as a prototype CALL application.},
}

@inproceedings{volodina-etal-2023-grandma-328176,
  author    = {Volodina, Elena and Dobnik, Simon and Lindström Tiedemann, Therese and Vu, Xuan-Son},
  title     = {Grandma {Karl} is 27 years old – research agenda for pseudonymization of research data},
  booktitle = {2023 IEEE Ninth International Conference on Big Data Computing Service and Applications (BigDataService), Athens, Greece, 2023},
  year      = {2023},
  publisher = {IEEE Computer Society},
  address   = {Los Alamitos},
  isbn      = {979-8-3503-3379-4},
  abstract  = {Accessibility of research data is critical for advances in many research fields, but textual data often cannot be shared due to the personal and sensitive information which it contains, e.g. names or political opinions. General Data Protection Regulation (GDPR) suggests pseudonymization as a solution to secure open access to research data, but we need to learn more about pseudonymization as an approach before adopting it for manipulation of research data. This paper outlines a research agenda within pseudonymization, namely need of studies into the effects of pseudonymization on unstructured data in relation to e.g. readability and language assessment, as well as the effectiveness of pseudonymization as a way of protecting writer identity, while also exploring different ways of developing context-sensitive algorithms for detection, labelling and replacement of personal information in unstructured data. The recently granted project on pseudonymization ‘Grandma Karl is 27 years old’ addresses exactly those challenges.},
}