@inproceedings{e3aa283db3ec482db5a597a30d1244bf,
title = "A probabilistic geocoding system utilising a parcel based address file",
abstract = "It is estimated that between 80% and 90% of governmental data collections contain address information, Geocoding - the process of assigning geographic coordinates to addresses - is becoming increasingly important in application areas that involve the analysis and mining of such data. In many cases, address records are captured and/or stored in a free-form or inconsistent manner. This fact complicates the task of accurately matching such addresses to spatially-annotated reference data. In this paper we describe a geocoding system that is based on a comprehensive high-quality geocoded national address database. It uses a learning address parser based on hidden Markov models to segment free-form addresses into components, and a rule-based matching engine to determine the best matches to the reference database.",
author = "Peter Christen and Alan Willmore and Tim Churches",
year = "2006",
doi = "10.1007/11677437_11",
language = "English",
isbn = "3540325476",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "130--145",
booktitle = "Data Mining",
address = "Germany",
}