When seeking for small local patterns it is very intricate to distinguish between incidental agglomeration of noisy points and true local patterns. We propose a new approach that addresses this problem by exploiting temporal information which is contained in most business data sets. The algorithm enables the detection of local patterns in noisy data sets more reliable compared to the case when the temporal information is ignored. This is achieved by making use of the fact that noise does not reproduce its incidental structure but even small patterns do. In particular, we developed a method to track clusters over time based on an optimal match of data partitions between time periods.
@InProceedings{hoppner_et_al:DagSemProc.07181.9, author = {H\"{o}ppner, Frank and B\"{o}ttcher, Mirko}, title = {{Reliably Capture Local Clusters in Noisy Domains From Parallel Universes}}, booktitle = {Parallel Universes and Local Patterns}, pages = {1--2}, series = {Dagstuhl Seminar Proceedings (DagSemProc)}, ISSN = {1862-4405}, year = {2007}, volume = {7181}, editor = {Michael R. Berthold and Katharina Morik and Arno Siebes}, publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik}, address = {Dagstuhl, Germany}, URL = {https://drops.dagstuhl.de/entities/document/10.4230/DagSemProc.07181.9}, URN = {urn:nbn:de:0030-drops-12617}, doi = {10.4230/DagSemProc.07181.9}, annote = {Keywords: Local pattern, time, parallel universe} }
Feedback for Dagstuhl Publishing