% Conference paper: "Feature grouping and selection over an undirected graph"
% (Yang, Yuan, Lai, Shen, Ye; KDD 2012). The opaque hash-style citation key is
% kept unchanged so that existing citations continue to resolve.
% Norm subscripts in the abstract/keywords are written in LaTeX math or plain
% ASCII so the entry stays safe under classic 8-bit BibTeX.
@inproceedings{35b64fec28f146bb89a0322ec26e9005,
  author    = {Yang, Sen and Yuan, Lei and Lai, Ying-Cheng and Shen, Xiaotong and Ye, Jieping},
  title     = {Feature grouping and selection over an undirected graph},
  booktitle = {{KDD'12} - 18th {ACM} {SIGKDD} International Conference on Knowledge Discovery and Data Mining},
  series    = {Proceedings of the {ACM} {SIGKDD} International Conference on Knowledge Discovery and Data Mining},
  year      = {2012},
  pages     = {922--930},
  doi       = {10.1145/2339530.2339675},
  isbn      = {9781450314626},
  language  = {English (US)},
  keywords  = {classification, feature grouping, feature selection, l1 regularization, regression, undirected graph},
  abstract  = {High-dimensional regression/classification continues to be an important and challenging problem, especially when features are highly correlated. Feature selection, combined with additional structure information on the features has been considered to be promising in promoting regression/classification performance. Graph-guided fused lasso (GFlasso) has recently been proposed to facilitate feature selection and graph structure exploitation, when features exhibit certain graph structures. However, the formulation in GFlasso relies on pairwise sample correlations to perform feature grouping, which could introduce additional estimation bias. In this paper, we propose three new feature grouping and selection methods to resolve this issue. The first method employs a convex function to penalize the pairwise $\ell_\infty$ norm of connected regression/classification coefficients, achieving simultaneous feature grouping and selection. The second method improves the first one by utilizing a non-convex function to reduce the estimation bias. The third one is the extension of the second method using a truncated $\ell_1$ regularization to further reduce the estimation bias. The proposed methods combine feature grouping and feature selection to enhance estimation accuracy. We employ the alternating direction method of multipliers (ADMM) and difference of convex functions (DC) programming to solve the proposed formulations. Our experimental results on synthetic data and two real datasets demonstrate the effectiveness of the proposed methods.},
  note      = {18th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2012 ; Conference date: 12-08-2012 Through 16-08-2012},
}