% Conference paper in the IEEE Big Data 2015 proceedings. Conference metadata is
% kept in eventtitle/eventdate and the publisher copyright in a non-printing field.
@inproceedings{303124f7b60f4363856d7d797c488c35,
  author     = {Ruta, Dymitr and Cen, Ling and Damiani, Ernesto},
  title      = {Fast summarization and anonymization of multivariate big time series},
  booktitle  = {Proceedings - 2015 {IEEE} International Conference on Big Data, {IEEE} Big Data 2015},
  editor     = {Luo, Feng and Ogan, Kemafor and Zaki, Mohammed J. and Haas, Laura and Ooi, Beng Chin and Kumar, Vipin and Rachuri, Sudarsan and Pyne, Saumyadipta and Ho, Howard and Hu, Xiaohua and Yu, Shipeng and Hsiao, Morris Hui-I and Li, Jian},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  address    = {United States},
  pages      = {1901--1904},
  year       = {2015},
  month      = dec,
  day        = {22},
  doi        = {10.1109/BigData.2015.7363965},
  language   = {British English},
  keywords   = {anonymization, big data, multi-variate time series, parallel processing, summarization},
  abstract   = {Sequential, predominantly temporal nature of the vast amounts of big data released every day from many different sources could potentially be linked, aligned along the time and deliver new evidence for the next generation predictive systems or knowledge discovery engines. However, big data owners are reluctant to share their data due to legally binding privacy and identity protection concerns, thereby posing a major hurdle preventing shared exploitation of big data on a massive scale. Data anonymization is expected to solve this problem, yet the current approaches are limited predominantly to univariate time series generalized by aggregation or clustering to eliminate identifiable uniqueness of individual data points or patterns. For multivariate time series, uniqueness among of the combination of values or patterns across multiple dimensions is much harder to eliminate due the to exponentially growing number of unique configurations of point values across multiple dimensions. Our method implements linearly scalable asynchronous summarization of multivariate time series independently at every dimension. As a result the series retain only a small subset of defining points at different times along multiple dimensions effectively breaking up the multivariate time series into a collection of summarized univariate time series that are perturbed from the original series in terms of actual points and pattern shapes. Current implementation of the anonymizing summarization involves shape preserving greedy elimination and aggregation that supports parallel cluster processing for big data implementation.},
  eventtitle = {3rd {IEEE} International Conference on Big Data, {IEEE} Big Data 2015},
  eventdate  = {2015-10-29/2015-11-01},
  copyright  = {{\textcopyright} 2015 IEEE},
}