Skip to main content
Språkbanken Text is a department within Språkbanken.

BibTeX

% Journal article. LaTeX specials in journal/abstract are escaped so the
% fields can be typeset; the capitalised subtitle word is brace-protected.
@article{cousse-etal-2023-anvands-332468,
	author       = {Coussé, Evie and Adesam, Yvonne and Rekathati, Faton and Berdicevskis, Aleksandrs},
	title        = {Hur används de, dem och dom i nutida skriftspråk? {En} storskalig korpusundersökning av nyheter och sociala medier},
	abstract     = {This study ties in with a longstanding debate on the Swedish spelling variants de, dem and dom for personal pronouns (third person plural) and definite articles (plural). It charts the usage of de, dem and dom in five large corpora with news and social media texts over the past 25 years. The corpora contain more than 1.5 billion tokens, which rules out manual handling of the data. Instead, this study makes use of computational methods (including an AI language model) to automatically identify and classify relevant observations. Analysis of the news corpora shows a relatively stable usage of de, dem and dom over the past 25 years. The forms de and dem are predominantly used according to the norm: de for pronouns in subject position and as a definite article; dem for pronouns in object position. The colloquial form dom is hardly found in news texts. Analysis of the social media corpora shows more variation and change. The colloquial form dom is used in 5–25\% of all instances instead of de or dem and has decreased after an initial rise. The forms de and dem are sometimes used in a non-standard way: de occurs in object position in 4–10\% of the observations; dem is found in subject position or as a definite article in 1–7\% of the cases. Non-standard dem is potentially on the rise with younger writers. The corpus analysis also provides details on the usage of de and dem in relative clauses, and on the users’ ratings of posts containing de, dem and dom on the social media platform Reddit.},
	journal      = {Språk \& Stil},
	year         = {2023},
	volume       = {NF 33},
	pages        = {39--70},
}

% Conference paper. The language name and the acronyms are brace-protected
% so sentence-casing styles keep their capitals.
@inproceedings{bloomstrom-etal-2023-preparing-328710,
	author       = {Bloom Ström, Eva-Marie and Slater, Onelisa and Zahran, Aron and Berdicevskis, Aleksandrs and Schumacher, Anne},
	title        = {Preparing a corpus of spoken {Xhosa}},
	booktitle    = {Proceedings of the 2023 {CLASP} Conference on Learning with Small Data ({LSD}), Gothenburg and online 11–12 September 2023},
	year         = {2023},
	publisher    = {Association for Computational Linguistics},
	address      = {Gothenburg, Sweden},
	ISBN         = {979-8-89176-000-4},
	pages        = {62--67},
}

% Workshop paper. Editors use the same "Last, First" form as the authors;
% the dataset name, task name, language name and acronym are brace-protected.
@inproceedings{volodina-etal-2023-dalaj-326817,
	author       = {Volodina, Elena and Ali Mohammed, Yousuf and Berdicevskis, Aleksandrs and Bouma, Gerlof and Öhman, Joey},
	title        = {{DaLAJ-GED} – a dataset for {Grammatical Error Detection} tasks on {Swedish}},
	booktitle    = {Proceedings of the 12th Workshop on Natural Language Processing for Computer Assisted Language Learning ({NLP4CALL} 2023)},
	editor       = {Alfter, David and Volodina, Elena and François, Thomas and Jönsson, Arne and Rennes, Evelina},
	year         = {2023},
	publisher    = {Linköping Electronic Conference Proceedings},
	address      = {Linköping},
	ISBN         = {978-91-8075-250-3},
	pages        = {94--101},
}

% Conference paper. The volume editors live in the editor field rather than
% inside booktitle; the benchmark name and language name are brace-protected.
@inproceedings{berdicevskis-etal-2023-superlim-331445,
	author       = {Berdicevskis, Aleksandrs and Bouma, Gerlof and Kurtz, Robin and Morger, Felix and Öhman, Joey and Adesam, Yvonne and Borin, Lars and Dannélls, Dana and Forsberg, Markus and Isbister, Tim and Lindahl, Anna and Malmsten, Martin and Rekathati, Faton and Sahlgren, Magnus and Volodina, Elena and Börjeson, Love and Hengchen, Simon and Tahmasebi, Nina},
	title        = {{Superlim}: A {Swedish} Language Understanding Evaluation Benchmark},
	booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, December 6–10, 2023, Singapore},
	editor       = {Bouamor, Houda and Pino, Juan and Bali, Kalika},
	year         = {2023},
	publisher    = {Association for Computational Linguistics},
	address      = {Stroudsburg, PA},
	ISBN         = {979-8-89176-060-8},
	pages        = {8137--8153},
}

% Conference paper. The pronoun "I" and the conference acronym are
% brace-protected so sentence-casing styles do not lowercase them.
@inproceedings{berdicevskis-erbro-2023-tomato-326355,
	author       = {Berdicevskis, Aleksandrs and Erbro, Viktor},
	title        = {You say tomato, {I} say the same: A large-scale study of linguistic accommodation in online communities},
	booktitle    = {Proceedings of the 24th Nordic Conference on Computational Linguistics ({NoDaLiDa})},
	year         = {2023},
	publisher    = {University of Tartu Library},
	ISBN         = {978-99-1621-999-7},
	pages        = {415--424},
}

% Miscellaneous item with author, title and year only.
% NOTE(review): the number field holds what looks like an ISO date
% (2023-03-20); standard styles do not print number for misc entries.
% Confirm whether it is the publication date and belongs in a date field.
@misc{cousse-etal-2023-inget-324690,
	author       = {Coussé, Evie and Adesam, Yvonne and Berdicevskis, Aleksandrs},
	title        = {Inget stöd i forskningen för att de/dem slås ut},
	year         = {2023},
	number       = {2023-03-20},
}

% Journal article in Linguistics Vanguard, volume 9 (2023), pages 1--8.
@article{ehret-etal-2023-measuring-326113,
	author       = {Ehret, Katharina and Berdicevskis, Aleksandrs and Bentz, Christian and Blumenthal-Dramé, Alice},
	title        = {Measuring language complexity: challenges and opportunities},
	journal      = {Linguistics Vanguard},
	year         = {2023},
	volume       = {9},
	pages        = {1--8},
}

% Miscellaneous item carrying volume, number and page-range data.
% NOTE(review): standard styles do not print volume, number or pages for
% misc entries. This looks like a journal special issue (volume 9, issue s1);
% confirm, and if so record the journal and a more specific entry type.
@misc{ehret-etal-2023-measuring-326620,
	author       = {Ehret, Katharina and Berdicevskis, Aleksandrs and Bentz, Christian and Blumenthal-Dramé, Alice},
	title        = {Measuring Language Complexity},
	year         = {2023},
	volume       = {9},
	number       = {s1},
	pages        = {1--167},
}