@inproceedings{f4a48c96687a457db24f30e96a3fd0bc,
title = "A solution to the curse of dimensionality problem in pairwise scoring techniques",
abstract = "This paper provides a solution to the curse of dimensionality problem in the pairwise scoring techniques that are commonly used in bioinformatics and biometrics applications. It has been recently discovered that stacking the pairwise comparison scores between an unknown patterns and a set of known patterns can result in feature vectors with nice discriminative properties for classification. However, such technique can lead to curse of dimensionality because the vectors size is equal to the training set size. To overcome this problem, this paper shows that the pairwise score matrices possess a symmetric and diagonally dominant property that allows us to select the most relevant features independently by an FDA-like technique. Then, the paper demonstrates the capability of the technique via a protein sequence classification problem. It was found that 10-fold reduction in the number of feature dimensions and recognition time can be achieved with just 4% reduction in recognition accuracy.",
keywords = "Curse of dimensionality, Feature selection, Fisher discriminant analysis, Protein sequence analysis, Subcellular localization, Support vector machines",
author = "Mak, {Man Wai} and Kung, {Sun Yuan}",
note = "Copyright: Copyright 2020 Elsevier B.V., All rights reserved.; 13th International Conference on Neural Information Processing, ICONIP 2006 ; Conference date: 03-10-2006 Through 06-10-2006",
year = "2006",
doi = "10.1007/11893028_36",
language = "English (US)",
isbn = "3540464794",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "314--323",
booktitle = "Neural Information Processing - 13th International Conference, ICONIP 2006, Proceedings",
address = "Germany",
}