Hoppa till huvudinnehåll

BibTeX

@inProceedings{Berdicevskis-Aleksandrs2020-290636,
	title        = {Older {English} Words Are More Polysemous},
	booktitle    = {The Evolution of Language: Proceedings of the 13th International Conference (EvoLang13)},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2020},
	publisher    = {The Evolution of Language Conferences},
	address      = {Nijmegen},
	pages        = {14--21},
}

@incollection{Berdicevskis-Aleksandrs2020-296607,
	author       = {Berdicevskis, Aleksandrs},
	title        = {Kogda morfologija bessil'na},
	booktitle    = {VAProsy jazykoznanija: megasbornik nanostatej},
	publisher    = {Buki-Vedi},
	address      = {Moskva},
	year         = {2020},
	pages        = {56--60},
	isbn         = {978-5-4465-2882-0},
}

@incollection{Berdicevskis-Aleksandrs2020-296274,
	title        = {Different trajectories of morphological overspecification and irregularity under imperfect language learning},
	booktitle    = {The Complexities of Morphology},
	author       = {Berdicevskis, Aleksandrs and Semenuks, Arturs},
	editor       = {Arkadiev, Peter and Gardani, Francesco},
	year         = {2020},
	publisher    = {Oxford University Press},
	address      = {Oxford},
	ISBN         = {9780198861287},
	pages        = {283--305},
}

@inProceedings{Berdicevskis-Aleksandrs2020-293349,
	title        = {A Diachronic Treebank of {Russian} Spanning More Than a Thousand Years},
	booktitle    = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020), May 11--16, 2020, Marseille, France},
	author       = {Berdicevskis, Aleksandrs and Eckhoff, Hanne},
	editor       = {Calzolari, Nicoletta},
	year         = {2020},
	publisher    = {European Language Resources Association},
	address      = {Paris},
	ISBN         = {979-10-95546-34-4},
}

@article{Roberts-Sean2020-292421,
	title        = {{CHIELD}: the causal hypotheses in evolutionary linguistics database},
	journal      = {Journal of Language Evolution},
	author       = {Roberts, Sean and Killin, Anton and Deb, Angarika and Sheard, Catherine and Greenhill, Simon and Sinnemäki, Kaius and Segovia-Martin, José and Nölle, Jonas and Berdicevskis, Aleksandrs and Humphreys-Balkwill, Archie and Little, Hannah and Opie, Cristopher and Jacques, Guillaume and Bromham, Lindell and Tinits, Peeter and Ross, Robert and Lee, Sean and Gasser, Emily and Calladine, Jasmine and Spike, Matthew and Mann, Stephen and Shcherbakova, Olena and Singer, Ruth and Zhang, Shuya and Benítez-Burraco, Antonio and Kliesch, Christian and Thomas-Colquhoun, Ewan and Skirgård, Hedvig and Tamariz, Monica and Passmore, Sam and Pellard, Thomas and Jordan, Fiona},
	year         = {2020},
	volume       = {5},
	number       = {2},
	pages        = {101--120},
}

@inProceedings{Derzhanski-Ivan2004-289179,
	title        = {O perevodimosti lingvisticheskih zadach: Uroki Pervoj mezhdunarodnoj lingvisticheskoj olimpiady},
	booktitle    = {Komp'juternaja lingvistika i intellektual'nye texnologii (Dialogue-2004). Trudy konferencii},
	author       = {Derzhanski, Ivan and Berdicevskis, Aleksandrs and Gilyarova, Kseniya and Iomdin, Boris and Rubinshtein, Maria},
	year         = {2004},
	pages        = {166--171},
}

@inProceedings{Boguslavsky-Igor2005-289178,
	title        = {Interactive Resolution of Intrinsic and Translational Ambiguity in a Machine Translation System},
	booktitle    = {Computational Linguistics and Intelligent Text Processing},
	series       = {Lecture Notes in Computer Science},
	volume       = {3406},
	author       = {Boguslavsky, Igor and Iomdin, Leonid and Lazursky, Alexander and Mityushin, Leonid and Sizov, Viktor and Kreydlin, Leonid and Berdicevskis, Aleksandrs},
	year         = {2005},
	publisher    = {Springer},
	ISBN         = {978-3-540-30586-6},
}

@inProceedings{Boguslavskij-Igor2005-288992,
	title        = {Interaktivnoe razreshenie neodnoznachnosti razlichnyx tipov v mashinnom perevode},
	booktitle    = {Komp'juternaja lingvistika i intellektual'nye texnologii (Dialogue-2005). Trudy konferencii},
	author       = {Boguslavskij, Igor and Iomdin, Leonid and Lazurskij, Aleksandr and Mitjushin, Leonid and Berdicevskis, Aleksandrs},
	year         = {2005},
	pages        = {216--221},
}

@incollection{Lazurskij-Aleksandr2005-288980,
	author       = {Lazurskij, Aleksandr and Berdicevskis, Aleksandrs and Krejdlin, Leonid and Mitjushin, Leonid and Sizov, Viktor},
	title        = {Interaktivnoe razreshenie leksicheskoj i sintaksicheskoj neodnoznachnosti v sistemah avtomaticheskoj obrabotki estestvennogo jazyka},
	booktitle    = {Internet-matematika 2005: sistemy obrabotki veb-dannyh},
	pages        = {44--66},
	year         = {2005},
}

@incollection{Berdicevskis-Aleksandrs2007-287992,
	author       = {Berdicevskis, Aleksandrs},
	title        = {Punktuacija kak sredstvo razreshenija neodnoznachnosti},
	booktitle    = {Struktury i interpretacii: raboty molodyx issledovatelej po teoreticheskoj i prikladnoj lingvistike},
	pages        = {11--32},
	year         = {2007},
	isbn         = {978-5-211-05488-2},
}

@inProceedings{Berdicevskis-Aleksandrs2007-287989,
	title        = {Rol' punktuacii v razreshenii neodnoznachnosti},
	booktitle    = {Komp'juternaja lingvistika i intellektual'nye texnologii (Dialogue-2007). Trudy konferencii},
	author       = {Berdicevskis, Aleksandrs and Iomdin, Boris},
	year         = {2007},
	pages        = {44--49},
}

@inProceedings{Iomdin-Boris2006-287988,
	title        = {A kto ètot ètot? Imena sobstvennye i opredelennaja neopredelennost’},
	booktitle    = {Komp'juternaja lingvistika i intellektual'nye texnologii (Dialogue-2006). Trudy konferencii},
	author       = {Iomdin, Boris and Berdicevskis, Aleksandrs},
	year         = {2006},
	pages        = {196--201},
}

@inProceedings{Iomdin-Boris2007-287986,
	title        = {Combinations of Probability Qualifiers in {Russian}},
	booktitle    = {Meaning - Text theory 2007: proceedings of the 3rd International Conference on Meaning - Text Theory},
	author       = {Iomdin, Boris and Berdicevskis, Aleksandrs},
	year         = {2007},
	pages        = {189--198},
}

@inProceedings{Berdicevskis-Aleksandrs2011-287907,
	title        = {E-mail vs. Chat: The influence of the communication channel on the language},
	booktitle    = {Computational linguistics and intellectual technologies. Papers from the annual international conference ``Dialogue''},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2011},
	volume       = {10},
	pages        = {84--93},
}

@misc{Berdicevskis-Aleksandrs2011-287904,
	author       = {Berdicevskis, Aleksandrs and Piperski, Aleksandr},
	title        = {Doubts About a Serial Founder-Effect Model of Language Expansion},
	year         = {2011},
}

@inProceedings{Berdicevskis-Aleksandrs2012-287867,
	title        = {Introducing pressure for expressivity into language evolution experiments},
	booktitle    = {The Evolution of Language: Proceedings of the 9th International Conference on the Evolution of Language},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2012},
	publisher    = {World Scientific},
	address      = {Singapore},
	ISBN         = {9781299742437},
	pages        = {64--71},
}

@inProceedings{Berdicevskis-Aleksandrs2014-287581,
	title        = {Verbal constructional profiles: reliability, distinction power and practical applications},
	abstract     = {In this paper we explore the notion of constructional profiles (the frequency distribution of a given linguistic item across syntactic environments) from two angles, methodological and applied. We concentrate on verbal constructional profiles, using Russian argument frame data in two different dependency formats. We first test the profiles’ stability and distinction power across sample sizes, and then use the profiles in two tasks concerning Russian aspect: to identify the aspectual partner of a given verb and to guess whether a given verb is perfective or imperfective.},
	booktitle    = {Proceedings of the Thirteenth International Workshop on Treebanks and Linguistic Theories},
	author       = {Berdicevskis, Aleksandrs and Eckhoff, Hanne},
	year         = {2014},
	pages        = {2--13},
}

@article{Eckhoff-Hanne2015-287287,
	title        = {Linguistics vs. digital editions: {The Tromsø Old Russian and OCS Treebank}},
	abstract     = {This article provides a description of the Tromsø Old Russian and OCS Treebank (TOROT), which, along with its parent treebank, the PROIEL corpus (built by members of the project Pragmatic Resources in Old Indo-European Languages), is the only existing treebank of Old Church Slavonic, Old East Slavic and Middle Russian texts. The TOROT is a part of a larger family of treebanks of ancient languages which all use the PROIEL open-source annotion web tool and annotation schemes. In this article we present principles and selected problems at several levels of analysis in the TOROT, and then briefly discuss ways that corpus linguists and edition philologists can fruitfully collaborate and complement each other.},
	journal      = {Scripta \& e-Scripta},
	author       = {Eckhoff, Hanne and Berdicevskis, Aleksandrs},
	year         = {2015},
	number       = {14--15},
	pages        = {9--25},
}

@inProceedings{Berdicevskis-Aleksandrs2015-287288,
	title        = {Estimating Grammeme Redundancy by Measuring Their Importance for Syntactic Parser Performance},
	abstract     = {Redundancy is an important psycholinguistic concept which is often used for explanations of language change, but is notoriously difficult to operationalize and measure. Assuming that the reconstruction of a syntactic structure by a parser can be used as a rough model of the understanding of a sentence by a human hearer, I propose a method for estimating redundancy. The key idea is to compare performances of a parser on a given treebank before and after artificially removing all information about a certain grammeme from the morphological annotation. The change in performance can be used as an estimate for the redundancy of the grammeme. I perform an experiment, applying MaltParser to an Old Church Slavonic treebank to estimate grammeme redundancy in Proto-Slavic. The results show that those Old Church Slavonic grammemes within the case, number and tense categories that were estimated as most redundant are those that disappeared in modern Russian. Moreover, redundancy estimates serve as a good predictor of case grammeme frequencies in modern Russian. The small sizes of the samples do not allow to make definitive conclusions for number and tense.},
	booktitle    = {Proceedings of the Sixth Workshop on Cognitive Aspects of Computational Language Learning},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2015},
	publisher    = {Association for Computational Linguistics},
	pages        = {65--73},
}

@inProceedings{Berdicevskis-Aleksandrs2015-287516,
	title        = {Automatic identification of shared arguments in verbal coordinations},
	booktitle    = {Computational linguistics and intellectual technologies. Papers from the annual international conference ``Dialogue''},
	author       = {Berdicevskis, Aleksandrs and Eckhoff, Hanne},
	year         = {2015},
	volume       = {14},
	pages        = {33--43},
}

@inProceedings{Bentz-Christian2016-286983,
	title        = {Learning pressures reduce morphological complexity: Linking corpus, computational and experimental evidence},
	abstract     = {The morphological complexity of languages differs widely and changes over time. Pathways of
change are often driven by the interplay of multiple competing factors, and are hard to disentangle. We here focus on a paradigmatic scenario of language change: the reduction of morphological complexity from Latin towards the Romance languages. To establish a causal explanation for
this phenomenon, we employ three lines of evidence: 1) analyses of parallel corpora to measure
the complexity of words in actual language production, 2) applications of NLP tools to further
tease apart the contribution of inflectional morphology to word complexity, and 3) experimental
data from artificial language learning, which illustrate the learning pressures at play when morphology simplifies. These three lines of evidence converge to show that pressures associated with
imperfect language learning are good candidates to causally explain the reduction in morphological complexity in the Latin-to-Romance scenario. More generally, we argue that combining
corpus, computational and experimental evidence is the way forward in historical linguistics and
linguistic typology.},
	booktitle    = {Proceedings of the Workshop on Computational Linguistics for Linguistic Complexity (CL4LC at COLING 2016)},
	author       = {Bentz, Christian and Berdicevskis, Aleksandrs},
	year         = {2016},
	publisher    = {Association for Computational Linguistics},
	pages        = {222--232},
}

@inProceedings{Eckhoff-Hanne2016-287182,
	title        = {Automatic parsing as an efficient pre-annotation tool for historical texts},
	abstract     = {Historical treebanks tend to be manually annotated, which is not surprising, since state-of-the-art parsers are not accurate enough to ensure high-quality annotation for historical texts. We test whether automatic parsing can be an efficient pre-annotation tool for Old East Slavic texts. We use the TOROT treebank from the PROIEL treebank family. We convert the PROIEL format to the CONLL format and use MaltParser to create syntactic pre-annotation. Using the most conservative evaluation method, which takes into account PROIEL-specific features, MaltParser by itself yields 0.845 unlabelled attachment score, 0.779 labelled attachment score and 0.741 secondary dependency accuracy (note, though, that the test set comes from a relatively simple genre and contains rather short sentences). Experiments with human annotators show that preparsing, if limited to sentences where no changes to word or sentence boundaries are required, increases their annotation rate. For experienced annotators, the speed gain varies from 5.80\% to 16.57\%, for inexperienced annotators from 14.61\% to 32.17\% (using conservative estimates). There are no strong reliable differences in the annotation accuracy, which means that there is no reason to suspect that using preparsing might lower the final annotation quality.},
	booktitle    = {Proceedings of the Workshop on Language Technology Resources and Tools for Digital Humanities (LT4DH at COLING 2016)},
	author       = {Eckhoff, Hanne and Berdicevskis, Aleksandrs},
	year         = {2016},
	publisher    = {Association for Computational Linguistics},
	pages        = {62--70},
}

@inProceedings{Eckhoff-Hanne2016-287184,
	title        = {From diachronic treebank to dictionary resource: the {Varangian Rus'} project},
	booktitle    = {Proceedings of the EURALEX 2016 conference},
	author       = {Eckhoff, Hanne and Berdicevskis, Aleksandrs},
	year         = {2016},
	publisher    = {Ivane Javakhishvili Tbilisi State University},
	pages        = {335--340},
}

@inProceedings{Berdicevskis-Aleksandrs2016-287185,
	title        = {The beginning of a beautiful friendship: rule-based and statistical analysis of {Middle Russian}},
	booktitle    = {Computational linguistics and intellectual technologies. Papers from the annual international conference ``Dialogue''},
	author       = {Berdicevskis, Aleksandrs and Eckhoff, Hanne and Gavrilova, Tatjana},
	year         = {2016},
	volume       = {15},
	publisher    = {Russian State University for the Humanities},
	pages        = {99--111},
}

@inProceedings{Berdicevskis-Aleksandrs2016-287286,
	title        = {Redundant features are less likely to survive: empirical evidence from the {Slavic} languages},
	abstract     = {We test whether the functionality (non-redundancy) of morphological features can serve as a predictor of the survivability of those features in the course of language change. We apply a recently proposed method of measuring functionality of a feature by estimating its importance for the performance of an automatic parser to the Slavic language group. We find that the functionality of a Common Slavic grammeme, together with the functionality of its category, is a significant predictor of its survivability in modern Slavic languages. The least functional grammemes within the most functional categories
are most likely to die out.},
	booktitle    = {The Evolution of Language: Proceedings of the 11th International Conference (EVOLANG11)},
	author       = {Berdicevskis, Aleksandrs and Eckhoff, Hanne},
	year         = {2016},
	ISBN         = {978-1-326-61450-8},
	pages        = {69--77},
}

@inProceedings{Berdicevskis-Aleksandrs2018-286919,
	title        = {Using {Universal Dependencies} in cross-linguistic complexity research},
	abstract     = {We evaluate corpus-based measures of linguistic complexity obtained using Universal Dependencies (UD) treebanks. We propose a method of estimating robustness of the complexity values obtained using a given measure and a given treebank. The results indicate that measures of syntactic complexity might be on average less robust than those of morphological complexity. We also estimate the validity of complexity measures by comparing the results for very similar languages and checking for
unexpected differences. We show that some of those differences that arise can be diminished by using parallel treebanks and, more importantly from the practical point of view, by harmonizing the language-specific solutions in the UD annotation.},
	booktitle    = {Proceedings of the Second Workshop on Universal Dependencies (UDW 2018)},
	author       = {Berdicevskis, Aleksandrs and Çöltekin, Çağrı and Ehret, Katharina and von Prince, Kilu and Ross, Daniel and Thompson, Bill and Yan, Chunxiao and Demberg, Vera and Lupyan, Gary and Rama, Taraka and Bentz, Christian},
	year         = {2018},
	publisher    = {Association for Computational Linguistics},
	pages        = {8--17},
}

@misc{Berdicevskis-Aleksandrs2018-286979,
	title        = {Proceedings of the First Shared Task on Measuring Language Complexity},
	author       = {Berdicevskis, Aleksandrs and Bentz, Christian},
	year         = {2018},
	ISBN         = {978-91-639-7435-9},
}

@incollection{Berdicevskis-Aleksandrs2012-287865,
	title        = {«Orfograficheskij» srednij rod: grammaticheskaja innovacija v jazyke russkogo Interneta},
	booktitle    = {Variativnost’ v jazyke i kommunikacii},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2012},
	ISBN         = {9785728113430},
	pages        = {51--72},
}

@incollection{Berdicevskis-Aleksandrs2014-287584,
	title        = {Slangs Go Online, or The Rise and Fall of the {Olbanian} language},
	booktitle    = {Digital Russia: The Language, Culture and Politics of New Media Communication},
	author       = {Berdicevskis, Aleksandrs and Zvereva, Vera},
	year         = {2014},
	publisher    = {Routledge},
	ISBN         = {978-0415707046},
	pages        = {122--140},
}

@incollection{Berdicevskis-Aleksandrs2014-287583,
	title        = {The written turn: how computer-mediated communication actuates linguistic change in {Russian}},
	booktitle    = {Digital Russia: The Language, Culture and Politics of New Media Communication},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2014},
	publisher    = {Routledge},
	ISBN         = {978-0415707046},
	pages        = {107--122},
}

@article{Berdicevskis-Aleksandrs2017-286981,
	title        = {{M. Baerman, D. Brown, G. G. Corbett} (eds.). {Understanding} and measuring morphological complexity},
	journal      = {Voprosy jazykoznanija - Journal of the Institute of Linguistics of the Russian Academy of Sciences},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2017},
	number       = {5},
	pages        = {123--135},
}

@article{Berdicevskis-Aleksandrs2012-287862,
	author       = {Berdicevskis, Aleksandrs},
	title        = {Jazykovaja slozhnost’},
	journal      = {Voprosy jazykoznanija - Journal of the Institute of Linguistics of the Russian Academy of Sciences},
	number       = {5},
	pages        = {101--124},
	year         = {2012},
}

@book{Berdicevskis-Aleksandrs2013-287751,
	title        = {Language Change Online: Linguistic Innovations in {Russian} Induced by Computer-Mediated Communication},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2013},
	ISBN         = {978-82-308-2334-7},
}

@incollection{Berdicevskis-Aleksandrs2014-287749,
	title        = {``Ty chto-to pechatala, ja tebja perebil'': igra so strukturoj dialoga v kvazisinxronnoj kommunikacii},
	booktitle    = {Sovremennyj russkij jazyk v internete},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2014},
	publisher    = {Jazyki slavjanskoj kul'tury},
	ISBN         = {978-5-9551-0722-6},
	pages        = {61--82},
}

@incollection{Berdicevskis-Aleksandrs2014-287748,
	title        = {Predictors of pluricentricity: lexical divergences between {Latvian Russian} and {Russian Russian}},
	booktitle    = {The Russian Language Outside the Nation},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2014},
	publisher    = {Edinburgh University Press},
	ISBN         = {9780748668458},
	pages        = {225--246},
}

@misc{Berdicevskis-Aleksandrs2020-297688,
	title        = {Pizzas and vermouth},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2020},
	publisher    = {Faber \& Faber},
	ISBN         = {9781783352203},
	pages        = {150--151},
}

@inProceedings{Berdicevskis-Aleksandrs2020-297403,
	title        = {Subjects tend to be coded only once: Corpus-based and grammar-based evidence for an efficiency-driven trade-off},
	booktitle    = {Proceedings of the 19th International Workshop on Treebanks and Linguistic Theories, TLT 2020, 27–28 October 2020, Düsseldorf, Germany},
	author       = {Berdicevskis, Aleksandrs and Schmidtke-Bode, Karsten and Seržant, Ilja},
	year         = {2020},
	publisher    = {Association for Computational Linguistics},
	address      = {Stroudsburg, PA},
	ISBN         = {978-1-952148-01-9},
}

@inProceedings{Berdicevskis-Aleksandrs2020-297766,
	title        = {Foreigner-directed speech is simpler than native-directed: Evidence from social media},
	booktitle    = {Proceedings of the Fourth Workshop on Natural Language Processing and Computational Social Science, NLP+CSS 2020, November 20, 2020, Online},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2020},
	publisher    = {Association for Computational Linguistics},
	ISBN         = {978-1-952148-80-4},
	pages        = {163--172},
}

@inProceedings{Veeman-Hartger2020-297782,
	title        = {Cross-lingual Embeddings Reveal Universal and Lineage-Specific Patterns in Grammatical Gender Assignment},
	booktitle    = {Proceedings of the 24th Conference on Computational Natural Language Learning, Online, November 19-20, 2020},
	author       = {Veeman, Hartger and Allassonnière-Tang, Marc and Berdicevskis, Aleksandrs and Basirat, Ali},
	year         = {2020},
	publisher    = {Association for Computational Linguistics},
	ISBN         = {978-1-952148-63-7},
	pages        = {265--275},
}

@inProceedings{Berdicevskis-Aleksandrs2020-298524,
	title        = {Corpus evidence for word order freezing in {Russian} and {German}},
	booktitle    = {Proceedings of the Fourth Workshop on Universal Dependencies (UDW 2020), December 13, 2020, Barcelona, Spain (Online)},
	author       = {Berdicevskis, Aleksandrs and Piperski, Alexander},
	editor       = {de Marneffe, Marie-Catherine and de Lhoneux, Miryam and Nivre, Joakim and Schuster, Sebastian},
	year         = {2020},
	publisher    = {Association for Computational Linguistics},
	ISBN         = {978-1-952148-48-4},
	pages        = {26--33},
}

@techreport{Adesam-Yvonne2020-299130,
	title        = {{SwedishGLUE} – Towards a {Swedish} Test Set for Evaluating Natural Language Understanding Models},
	author       = {Adesam, Yvonne and Berdicevskis, Aleksandrs and Morger, Felix},
	year         = {2020},
	institution  = {University of Gothenburg},
}

@inProceedings{Adesam-Yvonne2021-304973,
	title        = {Part-of-speech tagging of {Swedish} texts in the neural era},
	booktitle    = {Proceedings of the 23rd Nordic Conference on Computational Linguistics, NoDaLiDa, May 31–2 June, 2021, Reykjavik, Iceland (online)},
	author       = {Adesam, Yvonne and Berdicevskis, Aleksandrs},
	editor       = {Dobnik, Simon and Øvrelid, Lilja},
	year         = {2021},
	publisher    = {Linköping University Electronic Press},
	address      = {Linköping},
	ISBN         = {978-91-7929-614-8},
}

@article{Ehret-Katharina2021-304914,
	title        = {Meaning and Measures: Interpreting and Evaluating Complexity Metrics},
	journal      = {Frontiers in Communication},
	author       = {Ehret, Katharina and Blumenthal-Dramé, Alice and Bentz, Christian and Berdicevskis, Aleksandrs},
	year         = {2021},
	volume       = {6},
}

@article{Basirat-Ali2021-302492,
	author       = {Basirat, Ali and Allassonnière-Tang, Marc and Berdicevskis, Aleksandrs},
	title        = {An empirical study on the contribution of formal and semantic features to the grammatical gender of nouns},
	journal      = {Linguistics Vanguard},
	volume       = {7},
	number       = {1},
	year         = {2021},
	abstract     = {This study conducts an experimental evaluation of two hypotheses about the contributions of formal and semantic features to the grammatical gender assignment of nouns. One of the hypotheses (Corbett and Fraser 2000) claims that semantic features dominate formal ones. The other hypothesis, formulated within the optimal gender assignment theory (Rice 2006), states that form and semantics contribute equally. Both hypotheses claim that the combination of formal and semantic features yields the most accurate gender identification. In this paper, we operationalize and test these hypotheses by trying to predict grammatical gender using only character-based embeddings (that capture only formal features), only context-based embeddings (that capture only semantic features) and the combination of both. We performed the experiment using data from three languages with different gender systems (French, German and Russian). Formal features are a significantly better predictor of gender than semantic ones, and the difference in prediction accuracy is very large. Overall, formal features are also significantly better than the combination of form and semantics, but the difference is very small and the results for this comparison are not entirely consistent across languages.},
}

@book{Berdicevskis-Aleksandrs2021-311612,
	author       = {Berdicevskis, Aleksandrs and Piperski, Alexander},
	title        = {Tri skljanki popoludni i drugie zadachi po lingvistike},
	publisher    = {Alpina Non-Fiction},
	address      = {Moskva},
	year         = {2021},
	isbn         = {978-5-00139-130-2},
}

@inProceedings{Berdicevskis-Aleksandrs2021-311655,
	title        = {Successes and failures of {Menzerath’s} law at the syntactic level},
	booktitle    = {Second Workshop on Quantitative Syntax (Quasy, SyntaxFest 2021). Proceedings},
	author       = {Berdicevskis, Aleksandrs},
	year         = {2021},
	publisher    = {Association for Computational Linguistics},
	ISBN         = {978-1-955917-15-5},
	pages        = {17--32},
}