@inproceedings{58122dbff5e846e09cf06e67f75039ef,
title = "Improving k-NN graph accuracy using local intrinsic dimensionality",
abstract = "The k-nearest neighbor (k-NN) graph is an important data structure for many data mining and machine learning applications. The accuracy of k-NN graphs depends on the object feature vectors, which are usually represented in high-dimensional spaces. Selecting the most important features is essential for providing compact object representations and for improving the graph accuracy. Having a compact feature vector can reduce the storage space and the computational complexity of search and learning tasks. In this paper, we propose NNWID-Descent, a similarity graph construction method that utilizes the NNF-Descent framework while integrating a new feature selection criterion, Support-Weighted Intrinsic Dimensionality, that estimates the contribution of each feature to the overall intrinsic dimensionality. Through extensive experiments on various datasets, we show that NNWID-Descent allows a significant amount of local feature vector sparsification while still preserving a reasonable level of graph accuracy.",
keywords = "Feature selection, Intrinsic dimensionality, Vector sparsification, k-nearest neighbor graph",
author = "Houle, {Michael E.} and Vincent Oria and Wali, {Arwa M.}",
note = "Publisher Copyright: {\textcopyright} 2017, Springer International Publishing AG.; 10th International Conference on Similarity Search and Applications, SISAP 2017 ; Conference date: 04-10-2017 Through 06-10-2017",
year = "2017",
doi = "10.1007/978-3-319-68474-1_8",
language = "English (US)",
isbn = "9783319684734",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "110--124",
editor = "Felix Borutta and Peer Kroger and Thomas Seidl and Christian Beecks",
booktitle = "Similarity Search and Applications - 10th International Conference, SISAP 2017, Proceedings",
address = "Germany",
}