% Conference paper from the PAKDD 2016 proceedings (Springer, Lecture Notes in Computer Science).
% Event details and the copyright line are kept in fields that standard styles do not print,
% so they no longer leak into the rendered citation through the note field.
% NOTE(review): the LNCS volume number is not recorded in this entry -- add a volume field once confirmed.
@inproceedings{9b6a17518a3b442291d4c25525de989a,
  author     = {Ranbaduge, Thilina and Vatsalan, Dinusha and Christen, Peter and Verykios, Vassilios},
  title      = {Hashing-Based Distributed Multi-Party Blocking for Privacy-Preserving Record Linkage},
  booktitle  = {Advances in Knowledge Discovery and Data Mining -- 20th {Pacific-Asia} Conference, {PAKDD} 2016, Proceedings},
  editor     = {Bailey, James and Khan, Latifur and Washio, Takashi and Dobbie, Gillian and Huang, Joshua Zhexue and Wang, Ruili},
  series     = {Lecture Notes in Computer Science},
  publisher  = {Springer International Publishing},
  address    = {Cham},
  year       = {2016},
  pages      = {415--427},
  doi        = {10.1007/978-3-319-31750-2_33},
  isbn       = {978-3-319-31749-6},
  language   = {English},
  keywords   = {Bloom filters, Clustering, Locality sensitive hashing},
  abstract   = {In many application domains organizations require information from multiple sources to be integrated. Due to privacy and confidentiality concerns often these organizations are not willing or allowed to reveal their sensitive and personal data to other database owners, and to any external party. This has led to the emerging research discipline of privacy-preserving record linkage (PPRL). We propose a novel blocking approach for multi-party PPRL to efficiently and effectively prune the record sets that are unlikely to match. Our approach allows each database owner to perform blocking independently except for the initial agreement of parameter settings and a final central hashing-based clustering. We provide an analysis of our technique in terms of complexity, quality, and privacy, and conduct an empirical study with large datasets. The results show that our approach is scalable with the size of the datasets and the number of parties, while providing better quality and privacy than previous multi-party private blocking approaches.},
  eventtitle = {20th {Pacific-Asia} Conference on Advances in Knowledge Discovery and Data Mining, {PAKDD} 2016},
  eventdate  = {2016-04-19/2016-04-22},
  copyright  = {{\textcopyright} Springer International Publishing Switzerland 2016},
}