@inproceedings{e908dfdb799e44409ee6e74ef6fca6b2,
title = "A protein classification method based on latent semantic analysis",
abstract = "In this paper a new method that uses Latent Semantic Analysis (LSA) to denote a protein sequence is proposed for researching the protein classification problem. A protein is vectorized according to its content of biological words: patterns and motifs, which are generated by utilizing TEIRESIAS algorithm and MEME/MAST system respectively. More precise description vectors of proteins are obtained through employing LSA. Those vectors are used to classify proteins combined with the Support Vector Machine (SVM). Experiments of family-level protein classification on Structural Classification of Proteins database show that the performance of this method is better than that of the other state-of-the-arts methods.",
author = "Yuan Yongsheng and Lin Lei and Dong Qiwen and Wang Xiaolong and Li Minghui",
year = "2005",
language = "英语",
isbn = "0780387406",
series = "Annual International Conference of the IEEE Engineering in Medicine and Biology - Proceedings",
pages = "7738--7741",
booktitle = "Proceedings of the 2005 27th Annual International Conference of the Engineering in Medicine and Biology Society, IEEE-EMBS 2005",
note = "2005 27th Annual International Conference of the Engineering in Medicine and Biology Society, IEEE-EMBS 2005 ; Conference date: 01-09-2005 Through 04-09-2005",
}