% Workshop paper from LDL 2015 (collocated with ACL-IJCNLP 2015).
% Cleaned-up repository export: names are in "Last, First" form without the
% escaped \{ \} the exporter emitted; the full proceedings title is in
% booktitle (it was previously in series); the exporter's copyright and
% conference-date boilerplate is kept in the non-printing annote field.
% NOTE(review): the surname "Rodriguez Doncel" was regrouped from the export's
% "Doncel, Victor Rodriguez" -- confirm against the published paper.
@inproceedings{89d139a074d44a8ab01038c3eb848060,
  author    = {McCrae, John P. and Cimiano, Philipp and Matteis, Luca and Navigli, Roberto and Rodr{\'i}guez Doncel, Victor and Vila-Suero, Daniel and Gracia, Jorge and Abele, Andrejs and Vulcu, Gabriela and Buitelaar, Paul},
  title     = {Reconciling Heterogeneous Descriptions of Language Resources},
  editor    = {Chiarcos, Christian and McCrae, John Philip and Osenova, Petya and Cimiano, Philipp and Ide, Nancy},
  booktitle = {Proceedings of the 4th Workshop on Linked Data in Linguistics: Resources and Applications, {LDL} 2015 -- collocated with 53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing, {ACL-IJCNLP} 2015},
  publisher = {Association for Computational Linguistics (ACL)},
  pages     = {39--48},
  year      = {2015},
  month     = jul,
  language  = {English},
  abstract  = {Language resources are a cornerstone of linguistic research and for the development of natural language processing tools, but the discovery of relevant resources remains a challenging task. This is due to the fact that relevant metadata records are spread among different repositories and it is currently impossible to query all these repositories in an integrated fashion, as they use different data models and vocabularies. In this paper we present a first attempt to collect and harmonize the metadata of different repositories, thus making them queriable and browsable in an integrated way. We make use of RDF and linked data technologies for this and provide a first level of harmonization of the vocabularies used in the different resources by mapping them to standard RDF vocabularies including Dublin Core and DCAT. Further, we present an approach that relies on NLP and in particular word sense disambiguation techniques to harmonize resources by mapping values of attributes - such as the type, license or intended use of a resource - into normalized values. Finally, as there are duplicate entries within the same repository as well as across different repositories, we also report results of detection of these duplicates.},
  annote    = {Publisher Copyright: {\textcopyright} 2015 Association for Computational Linguistics and Asian Federation of Natural Language Processing.; 4th Workshop on Linked Data in Linguistics: Resources and Applications, LDL 2015 ; Conference date: 31-07-2015},
}