@inproceedings{e605308361f141c1b42ec0c98ffeb240,
title = "A toolbox approach to flexible and efficient data mining",
abstract = "This paper describes a flexible and efficient toolbox based on the scripting language Python, capable of handling common tasks in data mining. Using either a relational database or flat files the toolbox gives the user a uniform view of a data collection. Two core features of the toolbox are caching of database queries and parallelism within a collection of independent queries. Our toolbox provides a number of routines for basic data mining tasks on top of which the user can add more functions - mainly domain and data collection dependent - for complex and time consuming data mining tasks.",
keywords = "Caching, Health data, Python, Relational database, SQL",
author = "Nielsen, {Ole M.} and Peter Christen and Markus Hegland and Tatiana Semenova and Timothy Hancock",
note = "Publisher Copyright: {\textcopyright} Springer-Verlag Berlin Heidelberg 2001.; 5th Pacific-Asia Conference on Knowledge Discovery and Data Mining, PAKDD 2001 ; Conference date: 16-04-2001 Through 18-04-2001",
year = "2001",
doi = "10.1007/3-540-45357-1_16",
language = "English",
isbn = "3540419101",
series = "Lecture Notes in Artificial Intelligence (Subseries of Lecture Notes in Computer Science)",
publisher = "Springer Verlag",
pages = "124--135",
editor = "David Cheung and Williams, {Graham J.} and Qing Li",
booktitle = "Advances in Knowledge Discovery and Data Mining - 5th Pacific-Asia Conference, PAKDD 2001, Proceedings",
address = "Germany",
}