% Conference paper in the CIBB 2008 revised selected papers volume (Springer, 2009).
@inproceedings{IOPORT.05569752,
  author     = {Ceccarelli, Michele and d'Acierno, Antonio and Facchiano, Angelo},
  title      = {A machine learning approach to mass spectra classification with unsupervised feature selection},
  booktitle  = {Computational intelligence methods for bioinformatics and biostatistics. 5th international meeting, {CIBB} 2008, Vietri sul Mare, Italy, October 3--4, 2008. Revised selected papers},
  pages      = {242--252},
  publisher  = {Springer},
  address    = {Berlin},
  year       = {2009},
  isbn       = {978-3-642-02503-7},
  doi        = {10.1007/978-3-642-02504-4_22},
  abstract   = {Summary: Mass spectrometry spectra are recognized as a screening tool for detecting discriminatory protein patterns. Mass spectra, however, are high dimensional data and a large number of local maxima (a.k.a. peaks) have to be analyzed; to tackle this problem we have developed a three-step strategy. After data pre-processing we perform an unsupervised feature selection phase aimed at detecting salient parts of the spectra which could be useful for the subsequent classification phase. The main contribution of the paper is the development of this feature selection and extraction procedure grounded on the theory of multi-scale spaces. Then we use support vector machines for classification. Results obtained by the analysis of a data set of tumor/healthy samples allowed us to correctly classify more than 95\% of samples. ROC analysis has been also performed.},
  identifier = {05569752},
}