{"id":"https://openalex.org/W2097979901","doi":"https://doi.org/10.3233/isb-2009-0395","title":"Prediction of Polyadenylation Signals in Human DNA Sequences using Nucleotide Frequencies","display_name":"Prediction of Polyadenylation Signals in Human DNA Sequences using Nucleotide Frequencies","publication_year":2009,"publication_date":"2009-01-01","ids":{"openalex":"https://openalex.org/W2097979901","doi":"https://doi.org/10.3233/isb-2009-0395","mag":"2097979901","pmid":"https://pubmed.ncbi.nlm.nih.gov/19795571"},"language":"en","primary_location":{"id":"doi:10.3233/isb-2009-0395","is_oa":false,"landing_page_url":"https://doi.org/10.3233/isb-2009-0395","pdf_url":null,"source":{"id":"https://openalex.org/S120694666","display_name":"In Silico Biology","issn_l":"1386-6338","issn":["1386-6338","1434-3207"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"In Silico Biology: Journal of Biological Systems Modeling and Multi-Scale Simulation","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048108232","display_name":"Firoz Ahmed","orcid":"https://orcid.org/0000-0003-4702-5144"},"institutions":[{"id":"https://openalex.org/I4210147764","display_name":"Institute of Microbial Technology","ror":"https://ror.org/055rjs771","country_code":"IN","type":"facility","lineage":["https://openalex.org/I2799351866","https://openalex.org/I4210134808","https://openalex.org/I4210147764","https://openalex.org/I66760702"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Firoz Ahmed","raw_affiliation_strings":["Bioinformatics Centre, Institute of Microbial\r\t\t\t Technology, Sector 39-A, Chandigarh, India","Bioinformatics Centre, Institute of Microbial Technology, Sector 39-A, Chandigarh, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bioinformatics Centre, Institute of Microbial\r\t\t\t Technology, Sector 39-A, Chandigarh, India","institution_ids":["https://openalex.org/I4210147764"]},{"raw_affiliation_string":"Bioinformatics Centre, Institute of Microbial Technology, Sector 39-A, Chandigarh, India","institution_ids":["https://openalex.org/I4210147764"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019181731","display_name":"Manish Kumar","orcid":"https://orcid.org/0000-0002-7936-9892"},"institutions":[{"id":"https://openalex.org/I4210147764","display_name":"Institute of Microbial Technology","ror":"https://ror.org/055rjs771","country_code":"IN","type":"facility","lineage":["https://openalex.org/I2799351866","https://openalex.org/I4210134808","https://openalex.org/I4210147764","https://openalex.org/I66760702"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Manish Kumar","raw_affiliation_strings":["Bioinformatics Centre, Institute of Microbial\r\t\t\t Technology, Sector 39-A, Chandigarh, India","Bioinformatics Centre, Institute of Microbial Technology, Sector 39-A, Chandigarh, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bioinformatics Centre, Institute of Microbial\r\t\t\t Technology, Sector 39-A, Chandigarh, India","institution_ids":["https://openalex.org/I4210147764"]},{"raw_affiliation_string":"Bioinformatics Centre, Institute of Microbial Technology, Sector 39-A, Chandigarh, India","institution_ids":["https://openalex.org/I4210147764"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051938893","display_name":"Gajendra P. S. Raghava","orcid":"https://orcid.org/0000-0002-8902-2876"},"institutions":[{"id":"https://openalex.org/I4210147764","display_name":"Institute of Microbial Technology","ror":"https://ror.org/055rjs771","country_code":"IN","type":"facility","lineage":["https://openalex.org/I2799351866","https://openalex.org/I4210134808","https://openalex.org/I4210147764","https://openalex.org/I66760702"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Gajendra P.S. Raghava","raw_affiliation_strings":["Bioinformatics Centre, Institute of Microbial\r\t\t\t Technology, Sector 39-A, Chandigarh, India","Bioinformatics Centre, Institute of Microbial Technology, Sector 39-A, Chandigarh, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bioinformatics Centre, Institute of Microbial\r\t\t\t Technology, Sector 39-A, Chandigarh, India","institution_ids":["https://openalex.org/I4210147764"]},{"raw_affiliation_string":"Bioinformatics Centre, Institute of Microbial Technology, Sector 39-A, Chandigarh, India","institution_ids":["https://openalex.org/I4210147764"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5048108232"],"corresponding_institution_ids":["https://openalex.org/I4210147764"],"apc_list":null,"apc_paid":null,"fwci":1.2284,"has_fulltext":false,"cited_by_count":54,"citation_normalized_percentile":{"value":0.78607947,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"9","issue":"3","first_page":"135","last_page":"148"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/polyadenylation","display_name":"Polyadenylation","score":0.9174470901489258},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5428067445755005},{"id":"https://openalex.org/keywords/nucleotide","display_name":"Nucleotide","score":0.5293387174606323},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5122022032737732},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.4946460425853729},{"id":"https://openalex.org/keywords/dna","display_name":"DNA","score":0.47837963700294495},{"id":"https://openalex.org/keywords/messenger-rna","display_name":"Messenger RNA","score":0.39601776003837585},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.3912937343120575},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.3790138065814972},{"id":"https://openalex.org/keywords/biological-system","display_name":"Biological system","score":0.37487006187438965},{"id":"https://openalex.org/keywords/molecular-biology","display_name":"Molecular biology","score":0.3275870084762573},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.31103086471557617},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25439751148223877},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.12992262840270996}],"concepts":[{"id":"https://openalex.org/C142575336","wikidata":"https://www.wikidata.org/wiki/Q412148","display_name":"Polyadenylation","level":4,"score":0.9174470901489258},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5428067445755005},{"id":"https://openalex.org/C512185932","wikidata":"https://www.wikidata.org/wiki/Q28745","display_name":"Nucleotide","level":3,"score":0.5293387174606323},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5122022032737732},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.4946460425853729},{"id":"https://openalex.org/C552990157","wikidata":"https://www.wikidata.org/wiki/Q7430","display_name":"DNA","level":2,"score":0.47837963700294495},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.39601776003837585},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.3912937343120575},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.3790138065814972},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.37487006187438965},{"id":"https://openalex.org/C153911025","wikidata":"https://www.wikidata.org/wiki/Q7202","display_name":"Molecular biology","level":1,"score":0.3275870084762573},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.31103086471557617},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25439751148223877},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.12992262840270996},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D001483","descriptor_name":"Base Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001483","descriptor_name":"Base Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001483","descriptor_name":"Base Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003854","descriptor_name":"Deoxyribonucleotides","qualifier_ui":"Q000032","qualifier_name":"analysis","is_major_topic":false},{"descriptor_ui":"D003854","descriptor_name":"Deoxyribonucleotides","qualifier_ui":"Q000032","qualifier_name":"analysis","is_major_topic":false},{"descriptor_ui":"D003854","descriptor_name":"Deoxyribonucleotides","qualifier_ui":"Q000032","qualifier_name":"analysis","is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011061","descriptor_name":"Poly A","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011061","descriptor_name":"Poly A","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011061","descriptor_name":"Poly A","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D026723","descriptor_name":"Polyadenylation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D026723","descriptor_name":"Polyadenylation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D026723","descriptor_name":"Polyadenylation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.3233/isb-2009-0395","is_oa":false,"landing_page_url":"https://doi.org/10.3233/isb-2009-0395","pdf_url":null,"source":{"id":"https://openalex.org/S120694666","display_name":"In Silico Biology","issn_l":"1386-6338","issn":["1386-6338","1434-3207"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"In Silico Biology: Journal of Biological Systems Modeling and Multi-Scale Simulation","raw_type":"journal-article"},{"id":"pmid:19795571","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/19795571","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"In silico biology","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320721","display_name":"Council of Scientific and Industrial Research, India","ror":"https://ror.org/021wm7p51"},{"id":"https://openalex.org/F4320338259","display_name":"CSIR - Institute of Microbial Technology","ror":"https://ror.org/055rjs771"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1566430503","https://openalex.org/W1574862351","https://openalex.org/W1588920293","https://openalex.org/W1604938182","https://openalex.org/W1770412798","https://openalex.org/W1828587713","https://openalex.org/W1857325778","https://openalex.org/W1972962841","https://openalex.org/W1988904557","https://openalex.org/W1990748933","https://openalex.org/W2001334836","https://openalex.org/W2083996291","https://openalex.org/W2094931538","https://openalex.org/W2098783856","https://openalex.org/W2099350714","https://openalex.org/W2101975376","https://openalex.org/W2102023232","https://openalex.org/W2105545925","https://openalex.org/W2107323504","https://openalex.org/W2113496982","https://openalex.org/W2125175668","https://openalex.org/W2129429612","https://openalex.org/W2132927776","https://openalex.org/W2136930152","https://openalex.org/W2140006817","https://openalex.org/W2140303894","https://openalex.org/W2149369033","https://openalex.org/W2151562469","https://openalex.org/W2152882361","https://openalex.org/W2155127403","https://openalex.org/W2159541136","https://openalex.org/W2159554382","https://openalex.org/W2161257366","https://openalex.org/W2161716000","https://openalex.org/W2166187656","https://openalex.org/W2168558973","https://openalex.org/W2170003281"],"related_works":["https://openalex.org/W1976007281","https://openalex.org/W195216885","https://openalex.org/W1968152888","https://openalex.org/W2081082232","https://openalex.org/W1983255013","https://openalex.org/W2015305388","https://openalex.org/W4321790508","https://openalex.org/W2089191559","https://openalex.org/W2019349449","https://openalex.org/W1982959161"],"abstract_inverted_index":{"The":[0],"polyadenylation":[1],"signal":[2],"plays":[3],"a":[4,14,58,74,106,111,122,134,140],"key":[5],"role":[6],"in":[7,25,57],"determining":[8],"the":[9,36,81],"site":[10],"for":[11,34,53,128],"addition":[12],"of":[13,40,68,91,113,125,142],"polyadenylated":[15],"tail":[16],"to":[17],"nascent":[18],"mRNA":[19],"and":[20,38,66,80,95,101,118],"its":[21],"mutation(s)":[22],"are":[23],"reported":[24],"many":[26],"diseases.":[27],"Thus,":[28],"identifying":[29],"poly(A)":[30,55],"sites":[31],"is":[32,145],"important":[33],"understanding":[35],"regulation":[37],"stability":[39],"mRNA.":[41],"In":[42],"this":[43,69,131],"study,":[44],"Support":[45],"Vector":[46],"Machine":[47],"(SVM)":[48],"models":[49,82],"have":[50],"been":[51],"developed":[52,84,109],"predicting":[54],"signals":[56],"DNA":[59],"sequence":[60],"using":[61,97,110],"100":[62],"nucleotides,":[63],"each":[64],"upstream":[65],"downstream":[67],"signal.":[70],"Here,":[71],"we":[72],"introduced":[73],"novel":[75],"split":[76],"nucleotide":[77],"frequency":[78],"technique,":[79],"thus":[83],"achieved":[85,121,133],"maximum":[86,123],"Matthews":[87],"correlation":[88],"coefficients":[89],"(MCC)":[90],"0.58,":[92],"0.69,":[93],"0.70":[94],"0.69":[96],"mononucleotide,":[98],"dinucleotide,":[99,114],"trinucleotide,":[100],"tetranucleotide":[102,119],"frequencies,":[103,120],"respectively.":[104],"Finally,":[105],"hybrid":[107],"model":[108,132],"combination":[112],"2nd":[115],"order":[116],"dinucleotide":[117],"MCC":[124],"0.72.":[126],"Moreover,":[127],"independent":[129],"datasets":[130],"precision":[135],"ranging":[136],"from":[137],"75.8-95.7%":[138],"with":[139],"sensitivity":[141],"57%,":[143],"which":[144],"better":[146],"than":[147],"any":[148],"other":[149],"known":[150],"methods.":[151]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":8},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":5},{"year":2014,"cited_by_count":8},{"year":2013,"cited_by_count":4}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
