@inProceedings{berdicevskis-eckhoff-2015-automatic-287516, title = {Automatic identification of shared arguments in verbal coordinations.}, booktitle = {Computational linguistics and intellectual technologies. Papers from the annual international conference "Dialogue", 14: 33–43}, author = {Berdicevskis, Aleksandrs and Eckhoff, Hanne}, year = {2015}, } @article{eckhoff-berdicevskis-2015-linguistics-287287, title = {Linguistics vs. digital editions: The Tromsø Old Russian and OCS Treebank}, abstract = {This article provides a description of the Tromsø Old Russian and OCS Treebank (TOROT), which, along with its parent treebank, the PROIEL corpus (built by members of the project Pragmatic Resources in Old Indo-European Languages), is the only existing treebank of Old Church Slavonic, Old East Slavic and Middle Russian texts. The TOROT is a part of a larger family of treebanks of ancient languages which all use the PROIEL open-source annotion web tool and annotation schemes. In this article we present principles and selected problems at several levels of analysis in the TOROT, and then briefly discuss ways that corpus linguists and edition philologists can fruitfully collaborate and complement each other.}, journal = {Scripta & e-Scripta}, author = {Eckhoff, Hanne and Berdicevskis, Aleksandrs}, year = {2015}, number = {14-15}, pages = {9--25}, } @inProceedings{berdicevskis-2015-estimating-287288, title = {Estimating Grammeme Redundancy by Measuring Their Importance for Syntactic Parser Performance.}, abstract = {Redundancy is an important psycholinguistic concept which is often used for explanations of language change, but is notoriously difficult to operationalize and measure. Assuming that the reconstruction of a syntactic structure by a parser can be used as a rough model of the understanding of a sentence by a human hearer, I propose a method for estimating redundancy. The key idea is to compare performances of a parser on a given treebank before and after artificially removing all information about a certain grammeme from the morphological annotation. The change in performance can be used as an estimate for the redundancy of the grammeme. I perform an experiment, applying MaltParser to an Old Church Slavonic treebank to estimate grammeme redundancy in Proto-Slavic. The results show that those Old Church Slavonic grammemes within the case, number and tense categories that were estimated as most redundant are those that disappeared in modern Russian. Moreover, redundancy estimates serve as a good predictor of case grammeme frequencies in modern Russian. The small sizes of the samples do not allow to make definitive conclusions for number and tense.}, booktitle = {Proceedings of the Sixth Workshop on Cognitive Aspects of Computational Language Learning, 65–73}, author = {Berdicevskis, Aleksandrs}, year = {2015}, publisher = {Association for Computational Linguistics}, }