@comment{BibTeX entries. Språkbanken Text is a department within Språkbanken.}

@inproceedings{bloomstrom-etal-2023-preparing-328710,
	title        = {Preparing a corpus of spoken {Xhosa}},
	booktitle    = {Proceedings of the 2023 CLASP Conference on Learning with Small Data (LSD), Gothenburg and online 11–12 September 2023},
	author       = {Bloom Ström, Eva-Marie and Slater, Onelisa and Zahran, Aron and Berdicevskis, Aleksandrs and Schumacher, Anne},
	year         = {2023},
	publisher    = {Association for Computational Linguistics},
	address      = {Gothenburg, Sweden},
	isbn         = {979-8-89176-000-4},
	pages        = {62--67},
}

@inproceedings{ahlberg-etal-2016-karp-246072,
	title        = {{Karp}: {Språkbanken’s} Open Lexical Infrastructure},
	booktitle    = {Globalex 2016, May 24, Portorož, Slovenia},
	author       = {Ahlberg, Malin and Borin, Lars and Forsberg, Markus and Olsson, Olof and Schumacher, Anne and Uppström, Jonatan},
	year         = {2016},
}

@techreport{hammarstedt-etal-2022-sparv-318399,
	title        = {{Sparv} 5 Developer’s Guide},
	abstract     = {The Sparv Pipeline developed by Språkbanken Text is a text analysis tool run from the command line. This Developer’s Guide describes its general structure and key concepts and serves as an API documentation. Most importantly, it describes how to write plugins for Sparv 5 so that you can add your own functions to the toolkit.},
	author       = {Hammarstedt, Martin and Schumacher, Anne and Borin, Lars and Forsberg, Markus},
	year         = {2022},
}

@techreport{hammarstedt-etal-2022-sparv-318405,
	title        = {{Sparv} 5 User Manual},
	abstract     = {The Sparv Pipeline developed by Språkbanken Text is a text analysis tool run from the command line. This user manual describes how to get Sparv 5 up and running on your own machine, how to configure it and how to use it for annotating your own corpora.},
	author       = {Hammarstedt, Martin and Schumacher, Anne and Borin, Lars and Forsberg, Markus},
	year         = {2022},
	institution  = {Institutionen för svenska, flerspråkighet och språkteknologi},
	address      = {Göteborg},
}

@inproceedings{ahlberg-etal-2016-sprakbanken's-246063,
	title        = {{Språkbanken’s} Open Lexical Infrastructure},
	abstract     = {Karp is an open lexical infrastructure and a web based tool for searching, exploring and developing lexical resources. Språkbanken currently hosts a number of lexicons in Karp and on-going work aims at broadening the type of resources that can be developed in the system. This abstract gives a short overview of Karp's basic functionality, and describes some current projects and on-going work.},
	booktitle    = {SLTC 2016. The Sixth Swedish Language Technology Conference, Umeå University, 17-18 November, 2016},
	author       = {Ahlberg, Malin and Borin, Lars and Forsberg, Markus and Olsson, Olof and Schumacher, Anne and Uppström, Jonatan},
	year         = {2016},
}

@techreport{hammarstedt-etal-2017-korp-256055,
	title        = {{Korp} 6 -- Technical Report},
	author       = {Hammarstedt, Martin and Roxendal, Johan and Öhrman, Maria and Borin, Lars and Forsberg, Markus and Schumacher, Anne},
	year         = {2017},
	institution  = {Institutionen för svenska språket, Göteborgs universitet},
}

@techreport{hammarstedt-etal-2017-korp-256056,
	title        = {{Korp} 6 -- Användarmanual},
	author       = {Hammarstedt, Martin and Borin, Lars and Forsberg, Markus and Roxendal, Johan and Schumacher, Anne and Öhrman, Maria},
	year         = {2017},
	institution  = {Institutionen för svenska språket, Göteborgs universitet},
}

@inproceedings{borin-etal-2016-sparv-246053,
	title        = {{Sparv}: {Språkbanken’s} corpus annotation pipeline infrastructure},
	abstract     = {Sparv is Språkbanken's corpus annotation pipeline infrastructure. The easiest way to use the pipeline is from its web interface with a plain text document. The pipeline uses in-house and external tools on the text to segment it into sentences and paragraphs, tokenise, tag parts-of-speech, look up in dictionaries and analyse compounds. The pipeline can also be run using a web API with XML results, and it is run locally at Språkbanken to prepare the documents in Korp, our corpus search tool. While the most sophisticated support is for modern Swedish, the pipeline supports 15 languages.},
	booktitle    = {SLTC 2016. The Sixth Swedish Language Technology Conference, Umeå University, 17-18 November, 2016},
	author       = {Borin, Lars and Forsberg, Markus and Hammarstedt, Martin and Rosén, Dan and Schäfer, Roland and Schumacher, Anne},
	year         = {2016},
}