% Conference paper record. The opaque hexadecimal citation key is kept
% unchanged so that existing \cite commands continue to resolve.
% Notes for maintainers:
%   - The percent sign in the abstract is escaped so that styles which typeset
%     the abstract do not treat it as the start of a TeX comment.
%   - booktitle carries the full proceedings title; no named publication
%     series is known for this volume, so no series field is given.
%   - The conference dates in the note are read as day-month-year
%     (two consecutive days in December 2013).
@inproceedings{b8424286406b415c93ed38f32ea68953,
  author    = {Iqbal, Muhammad Javed and Faye, Ibrahima and Said, Abas Md and Samir, Brahim Belhaouari},
  title     = {A distance-based feature-encoding technique for protein sequence classification in bioinformatics},
  booktitle = {Proceeding - {IEEE} {CYBERNETICSCOM} 2013: {IEEE} International Conference on Computational Intelligence and Cybernetics},
  publisher = {IEEE Computer Society},
  address   = {United States},
  year      = {2013},
  month     = dec,
  pages     = {1--5},
  doi       = {10.1109/CyberneticsCom.2013.6865770},
  isbn      = {9781467360531},
  language  = {English},
  keywords  = {Bioinformatics, Data mining, Feature-encoding, Protein classification, Superfamily},
  abstract  = {Bioinformatics has been emerging as a new research dimension since the last century by combining computer science and biology techniques for the automatic analysis of biological sequence data. The volume of the biological data gathered under different sequencing projects is increasing exponentially. These sequences contain extremely important information about genes, their structure and function. Computational techniques which involve machine learning and pattern recognition are becoming very useful on Bioinformatics data like DNA and protein. Protein classification into different groups could be used for knowing the structure or the function of unknown protein sequence. The process of classifying protein amino acid sequences into a family/superfamily is a very complex problem. However, from among other major issues in a protein classification, the critical one is an accurate representation of amino acid sequence during the feature extraction. In this work, we have proposed a distance-based feature-encoding method; the proposed technique has been tested with different classifiers, which have shown better results than the previously available techniques for superfamily classification of protein sequences. The maximum average classification accuracy obtained was 91.2\%. The dataset used in the experiments was taken from the well known UniProtKB protein database.},
  note      = {2nd IEEE International Conference on Computational Intelligence and Cybernetics, IEEE CYBERNETICSCOM 2013; conference date: 3--4 December 2013},
}