@inproceedings{c52df6658fa441b6b36f1fbed3d0edd8,
title = "Learning to extract folktale keywords",
abstract = "Manually assigned keywords provide a valuable means for accessing large document collections. They can serve as a shallow document summary and enable more efficient retrieval and aggregation of information. In this paper we investigate keywords in the context of the Dutch Folktale Database, a large collection of stories including fairy tales, jokes and urban legends. We carry out a quantitative and qualitative analysis of the keywords in the collection. Up to 80% of the assigned keywords (or a minor variation) appear in the text itself. Human annotators show moderate to substantial agreement in their judgment of keywords. Finally, we evaluate a learning to rank approach to extract and rank keyword candidates. We conclude that this is a promising approach to automate this time intensive task.",
keywords = "EWI-23556, METIS-297760, IR-87094",
author = "Trieschnigg, {Rudolf Berend} and Dong-Phuong Nguyen and Mariet Theune",
year = "2013",
month = aug,
language = "Undefined",
isbn = "978-1-937284-62-6",
publisher = "Association for Computational Linguistics (ACL)",
pages = "65--73",
editor = "P. Lendvai and K. Zervanou",
booktitle = "Proceedings of the 7th Workshop on Language Technology for Cultural Heritage, Social Sciences, and Humanities (LaTeCH 2013)",
address = "United States",
note = "7th Workshop on Language Technology for Cultural Heritage, Social Sciences, and Humanities, LaTeCH 2013 ; Conference date: 08-08-2013 Through 08-08-2013",
}