Abstract
Spatio-temporal clustering is a sub field of data mining that is increasingly gaining more scientific attention due to the advances of location-based or environmental devices that register position, time and, in some cases, other semantic attributes. This process pretends to group objects based in their spatial and temporal similarity helping to discover interesting patterns and correlations in large data sets. One of the main challenges of this area is the ability to integrate several dimensions in a general-purpose approach. In this paper, such general approach is proposed, based on an extension of the SNN (Shared Nearest Neighbor) algorithm. The 4D+SNN algorithm allows the integration of space, time and one or more semantic attributes in the clustering process. This algorithm is able to deal with different data sets and different discovery purposes as the user has the ability to weight the importance of each dimension in the discovery process. The results obtained are very promising as show interesting findings on data and open the possibility of integration of several dimensions of analysis in the clustering process.
Links
BibTeX (Download)
@inproceedings{oliveira20134d+, title = {4D+ SNN: a spatio-temporal density-based clustering approach with 4D similarity}, author = {Ricardo Oliveira and Maribel Yasmina Santos and João Moura Pires}, url = {http://dx.doi.org/10.1109/ICDMW.2013.119}, year = {2013}, date = {2013-01-01}, booktitle = {Data Mining Workshops (ICDMW), 2013 IEEE 13th International Conference on}, pages = {1045--1052}, organization = {IEEE}, abstract = {Spatio-temporal clustering is a sub field of data mining that is increasingly gaining more scientific attention due to the advances of location-based or environmental devices that register position, time and, in some cases, other semantic attributes. This process pretends to group objects based in their spatial and temporal similarity helping to discover interesting patterns and correlations in large data sets. One of the main challenges of this area is the ability to integrate several dimensions in a general-purpose approach. In this paper, such general approach is proposed, based on an extension of the SNN (Shared Nearest Neighbor) algorithm. The 4D+SNN algorithm allows the integration of space, time and one or more semantic attributes in the clustering process. This algorithm is able to deal with different data sets and different discovery purposes as the user has the ability to weight the importance of each dimension in the discovery process. The results obtained are very promising as show interesting findings on data and open the possibility of integration of several dimensions of analysis in the clustering process.}, keywords = {Clustering, Density-based Clustering, Distance Function, Spatio-temporal Clustering, Spatio-temporal Data}, pubstate = {published}, tppubtype = {inproceedings} }