% Conference paper published in the ESWC 2018 proceedings (Lecture Notes in
% Computer Science series). Names use the "von Last, First" form so that
% styles can sort and abbreviate them. Conference details are stored in
% eventtitle/eventdate and the publisher's copyright notice in copyright;
% classic BibTeX styles ignore these fields, so they no longer print as a note.
@inproceedings{184d7b150dcc4e55ae4499ec7fec6ddc,
  author     = {Neves, Angelo B. and de Oliveira, Rodrigo G. G. and Leme, Luiz Andr{\'e} P. Paes and Lopes, Giseli Rabello and Nunes, Bernardo P. and Casanova, Marco A.},
  title      = {Empirical Analysis of Ranking Models for an Adaptable Dataset Search},
  booktitle  = {The Semantic Web -- 15th International Conference, {ESWC} 2018, Proceedings},
  editor     = {Gangemi, Aldo and Troncy, Rapha{\"e}l and Navigli, Roberto and Hollink, Laura and Vidal, Maria-Esther and Hitzler, Pascal and Tordai, Anna and Alam, Mehwish},
  series     = {Lecture Notes in Computer Science},
  publisher  = {Springer International Publishing},
  address    = {Cham},
  year       = {2018},
  pages      = {50--64},
  doi        = {10.1007/978-3-319-93417-4_4},
  isbn       = {9783319934167},
  language   = {English},
  eventtitle = {15th Extended Semantic Web Conference, {ESWC} 2018},
  eventdate  = {2018-06-03/2018-06-07},
  copyright  = {{\textcopyright} 2018, Springer International Publishing AG, part of Springer Nature.},
  keywords   = {Dataset, Empirical evaluation, Entity linking, Linked Data, Ranking, Recommendation},
  abstract   = {Currently available datasets still have a large unexplored potential for interlinking. Ranking techniques contribute to this task by scoring datasets according to the likelihood of finding entities related to those of a target dataset. Ranked datasets can be either manually selected for standalone linking discovery tasks or automatically inspected by programs that would go through the ranking looking for entity links. This work presents empirical comparisons between different ranking models and argues that different algorithms could be used depending on whether the ranking is manually or automatically handled and, also, depending on the available metadata of the datasets. Experiments indicate that ranking algorithms that performed best with nDCG do not always have the best Recall at Position k, for high recall levels. The best ranking model for the manual use case (with respect to nDCG) may need 13\% more datasets for 90\% of recall, i.e., instead of just a slice of 34\% of the datasets at the top of the ranking, reached by the best model for the automatic use case (with respect to recall@k), it would need almost 47\% of the ranking.},
}