% open1665 -- journal article (Genomics 105(4), 2015) describing the RNApin
% web server for predicting protein-interacting nucleotides in RNA sequences.
% The abstract is kept verbatim from the export. NOTE(review): "84.82 specificity"
% looks like it is missing a percent sign and "SMO" is listed twice -- confirm
% against the published abstract before changing.
@article{open1665,
  author    = {Panwar, Bharat and Raghava, G. P. S.},
  title     = {Identification of protein-interacting nucleotides in a {RNA} sequence using composition profile of tri-nucleotides},
  journal   = {Genomics},
  year      = {2015},
  month     = apr,
  volume    = {105},
  number    = {4},
  pages     = {197--203},
  publisher = {Elsevier},
  note      = {Copyright of this article belongs to Elsevier.},
  keywords  = {Protein-interacting nucleotide (PIN); Binary profile of patterns (BPP); Tri-nucleotide composition profile of patterns (TNCPP); SVM; Prediction; RNApin},
  url       = {http://crdd.osdd.net/open/1665/},
  abstract  = {The RNA-protein interactions play a diverse role in the cells, thus identification of RNA-protein interface is essential for the biologist to understand their function. In the past, several methods have been developed for predicting RNA interacting residues in proteins, but limited efforts have been made for the identification of protein-interacting nucleotides in RNAs. In order to discriminate protein-interacting and non-interacting nucleotides, we used various classifiers (NaiveBayes, NaiveBayesMultinomial, BayesNet, ComplementNaiveBayes, MultilayerPerceptron, J48, SMO, RandomForest, SMO and SVM(light)) for prediction model development using various features and achieved highest 83.92\% sensitivity, 84.82 specificity, 84.62\% accuracy and 0.62 Matthew's correlation coefficient by SVM(light) based models. We observed that certain tri-nucleotides like ACA, ACC, AGA, CAC, CCA, GAG, UGA, and UUU preferred in protein-interaction. All the models have been developed using a non-redundant dataset and are evaluated using five-fold cross validation technique. A web-server called RNApin has been developed for the scientific community (http://crdd.osdd.net/raghava/rnapin/).},
}