% Loh and Dasu, "Effect of data repair on mining network streams", ICDMW 2012 workshop paper.
% Cleaned up from an automated export:
%   - the citation key is kept as exported so existing citations keep resolving;
%   - the former "series" field was a verbatim copy of booktitle and has been dropped;
%   - the former "note" field repeated the conference name and carried
%     "Conference date: 10-12-2012 Through 10-12-2012"; month below assumes that
%     date is DD-MM-YYYY (10 December 2012) -- TODO confirm against the publisher record;
%   - the braces around {Ji Meng} are kept from the export so the two-part given
%     name is treated as a single token.
@inproceedings{99f2111dfbe0489cb76e128bdfd915f3,
  author    = {Loh, {Ji Meng} and Dasu, Tamraparni},
  title     = {Effect of data repair on mining network streams},
  booktitle = {Proceedings - 12th {IEEE} International Conference on Data Mining Workshops, {ICDMW} 2012},
  year      = {2012},
  month     = dec,
  pages     = {226--233},
  doi       = {10.1109/ICDMW.2012.125},
  isbn      = {9780769549255},
  language  = {american},
  keywords  = {Big data, Data glitches, Earth mover distance, Missing values, Network analysis, Outliers},
  abstract  = {Data quality issues have special implications in network data. Data glitches are propagated rapidly along pathways dictated by the hierarchy and topology of the network. In this paper, we use temporal data from a vast data network to study data glitches and their effect on network monitoring tasks such as anomaly detection. We demonstrate the consequences of cleaning the data, and develop targeted and customized cleaning strategies by exploiting the network hierarchy.},
}