@inproceedings{f3c01e2b573a4ee0a7decc2848367cfb,
title = "Improving temporal record linkage using regression classification",
abstract = "Temporal record linkage is the process of identifying groups of records that are collected over a period of time, such as in census or voter registration databases, where records in the same group represent the same real-world entity. Such databases often contain temporal information, such as the time when a record was created or when it was modified. Unlike traditional record linkage, which considers differences between records from the same entity as errors or variations, temporal record linkage aims to capture records from entities where the attribute values are known to change over time. In this paper we propose a novel approach that extends an existing temporal approach called decay model, to categorically calculate probabilities of change for each attribute. Our novel method uses a regression-based machine learning model to predict decays for sets of attributes. Each such set of attributes has a principle attribute and support attributes, where values of the support attributes can affect the decay of the principle attribute. Our experimental results on a real US voter database show that our proposed approach results in better linkage quality compared to the decay model approach.",
keywords = "Attribute weighting, Data matching, Decay, Entity resolution, Temporal data",
author = "Yichen Hu and Qing Wang and Dinusha Vatsalan and Peter Christen",
note = "Publisher Copyright: {\textcopyright} 2017, Springer International Publishing AG.; 21st Pacific-Asia Conference on Knowledge Discovery and Data Mining, PAKDD 2017 ; Conference date: 23-05-2017 Through 26-05-2017",
year = "2017",
doi = "10.1007/978-3-319-57454-7_44",
language = "English",
isbn = "9783319574530",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "561--573",
editor = "Kyuseok Shim and Jae-Gil Lee and Longbing Cao and Xuemin Lin and Jinho Kim and Yang-Sae Moon",
booktitle = "Advances in Knowledge Discovery and Data Mining - 21st Pacific-Asia Conference, PAKDD 2017, Proceedings",
address = "Germany",
}