{"id":"https://openalex.org/W7155192359","doi":"https://doi.org/10.1093/bioinformatics/btag194","title":"Spark: sparse hierarchical energy minimization for scalable prediction of RNA pseudoknots","display_name":"Spark: sparse hierarchical energy minimization for scalable prediction of RNA pseudoknots","publication_year":2026,"publication_date":"2026-04-18","ids":{"openalex":"https://openalex.org/W7155192359","doi":"https://doi.org/10.1093/bioinformatics/btag194","pmid":"https://pubmed.ncbi.nlm.nih.gov/42015361"},"language":"en","primary_location":{"id":"doi:10.1093/bioinformatics/btag194","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btag194","pdf_url":null,"source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1093/bioinformatics/btag194","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032834665","display_name":"Mateo Gray","orcid":"https://orcid.org/0000-0001-7143-1367"},"institutions":[{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Mateo Gray","raw_affiliation_strings":["Department of Biomedical Engineering, University of Alberta, Edmonton, Alberta, T6G 2R3, Canada"],"raw_orcid":"https://orcid.org/0000-0001-7143-1367","affiliations":[{"raw_affiliation_string":"Department of Biomedical Engineering, University of Alberta, Edmonton, Alberta, T6G 2R3, Canada","institution_ids":["https://openalex.org/I154425047"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103135268","display_name":"Sebastian Will","orcid":"https://orcid.org/0000-0002-2376-9205"},"institutions":[{"id":"https://openalex.org/I142476485","display_name":"\u00c9cole Polytechnique","ror":"https://ror.org/05hy3tk52","country_code":"FR","type":"education","lineage":["https://openalex.org/I142476485","https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I4210139461","display_name":"Laboratoire d'Informatique de l'\u00c9cole Polytechnique","ror":"https://ror.org/04afed728","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I142476485","https://openalex.org/I4210139461","https://openalex.org/I4210145102","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Sebastian Will","raw_affiliation_strings":["Laboratoire d\u2019informatique de l\u2019\u00c9cole polytechnique (LIX), Institut Polytechnique de Paris, 91120 Palaiseau, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Laboratoire d\u2019informatique de l\u2019\u00c9cole polytechnique (LIX), Institut Polytechnique de Paris, 91120 Palaiseau, France","institution_ids":["https://openalex.org/I4210139461","https://openalex.org/I142476485"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005818804","display_name":"Hosna Jabbari","orcid":"https://orcid.org/0000-0002-7155-2297"},"institutions":[{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Hosna Jabbari","raw_affiliation_strings":["Department of Biomedical Engineering, University of Alberta, Edmonton, Alberta, T6G 2R3, Canada"],"raw_orcid":"https://orcid.org/0000-0002-7155-2297","affiliations":[{"raw_affiliation_string":"Department of Biomedical Engineering, University of Alberta, Edmonton, Alberta, T6G 2R3, Canada","institution_ids":["https://openalex.org/I154425047"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":3618,"currency":"USD","value_usd":3618},"apc_paid":{"value":3618,"currency":"USD","value_usd":3618},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.59194354,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"42","issue":"5","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.8970000147819519,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.8970000147819519,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.05420000106096268,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10604","display_name":"RNA Research and Splicing","score":0.006899999920278788,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6524999737739563},{"id":"https://openalex.org/keywords/minification","display_name":"Minification","score":0.6103000044822693},{"id":"https://openalex.org/keywords/energy-minimization","display_name":"Energy minimization","score":0.5152000188827515},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.48339998722076416},{"id":"https://openalex.org/keywords/r-package","display_name":"R package","score":0.43970000743865967}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7364000082015991},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6524999737739563},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.6103000044822693},{"id":"https://openalex.org/C14961307","wikidata":"https://www.wikidata.org/wiki/Q5377176","display_name":"Energy minimization","level":2,"score":0.5152000188827515},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.48339998722076416},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4794999957084656},{"id":"https://openalex.org/C2984074130","wikidata":"https://www.wikidata.org/wiki/Q73539779","display_name":"R package","level":2,"score":0.43970000743865967},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.414900004863739},{"id":"https://openalex.org/C67705224","wikidata":"https://www.wikidata.org/wiki/Q11053","display_name":"RNA","level":3,"score":0.41019999980926514},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4074999988079071},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.28369998931884766},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.2833000123500824},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.25920000672340393}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009690","descriptor_name":"Nucleic Acid Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D009690","descriptor_name":"Nucleic Acid Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012313","descriptor_name":"RNA","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D012313","descriptor_name":"RNA","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D013816","descriptor_name":"Thermodynamics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013816","descriptor_name":"Thermodynamics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D059370","descriptor_name":"RNA Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D059370","descriptor_name":"RNA Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":3,"locations":[{"id":"doi:10.1093/bioinformatics/btag194","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btag194","pdf_url":null,"source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},{"id":"pmid:42015361","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/42015361","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics (Oxford, England)","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:13171173","is_oa":true,"landing_page_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC13171173/","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Bioinformatics","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1093/bioinformatics/btag194","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btag194","pdf_url":null,"source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7884083986282349,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"},{"id":"https://openalex.org/F4320334601","display_name":"National Research Council Canada","ror":"https://ror.org/04mte1k06"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1542565836","https://openalex.org/W1873547760","https://openalex.org/W1999060916","https://openalex.org/W2004945910","https://openalex.org/W2037367916","https://openalex.org/W2041882488","https://openalex.org/W2048814860","https://openalex.org/W2064714768","https://openalex.org/W2069779808","https://openalex.org/W2083479074","https://openalex.org/W2086561953","https://openalex.org/W2119185511","https://openalex.org/W2119336718","https://openalex.org/W2123241418","https://openalex.org/W2138455866","https://openalex.org/W2147459598","https://openalex.org/W2148599336","https://openalex.org/W2162224067","https://openalex.org/W2167516501","https://openalex.org/W2339509753","https://openalex.org/W2750655368","https://openalex.org/W2807635396","https://openalex.org/W4392343346","https://openalex.org/W4393951763"],"related_works":[],"abstract_inverted_index":{"MOTIVATION:":[0],"The":[1],"biological":[2,31],"functions":[3],"of":[4,38,88,162,227,259],"RNAs":[5],"are":[6,21,45,53],"tightly":[7],"connected":[8],"to":[9,17,56,71,104,189],"their":[10],"specific":[11],"RNA":[12,32,117,229,245],"structures.":[13,43,118,230],"As":[14],"experimental":[15],"techniques":[16],"determine":[18],"high-accuracy":[19],"structures":[20,125],"costly":[22],"and":[23,145,153,181,201,210,220,240,262],"time-consuming,":[24],"computational":[25],"prediction":[26,37,63,75,92,226,236],"approaches":[27],"became":[28],"indispensable":[29],"for":[30,114,137,223,242],"research;":[33],"most":[34],"notably,":[35],"the":[36,81,89,122,131,151,160,198,224,260],"minimum":[39],"free":[40],"energy":[41,135,143],"secondary":[42],"Pseudoknots":[44],"prevalent,":[46],"highly":[47],"significant":[48],"structural":[49],"motifs,":[50],"yet":[51],"they":[52],"commonly":[54],"ignored":[55],"achieve":[57],"acceptable":[58],"efficiency.":[59],"Existing":[60],"reliable":[61],"pseudoknot":[62,74,91,235],"methods":[64],"typically":[65],"have":[66],"prohibitive":[67],"complexity.":[68],"A":[69],"route":[70],"fast":[72,219],"scalable":[73],"was":[76],"suggested":[77],"with":[78,173,255],"HFold":[79,129,165],"following":[80],"hierarchical":[82,105,211],"folding":[83,212],"hypothesis.":[84],"Recent":[85],"successful":[86],"sparsification":[87,140,209],"CCJ":[90],"algorithm":[93,113],"in":[94,130,213,216,237],"Knotty":[95],"promises":[96],"a":[97,111,168,256],"further":[98],"boost":[99],"by":[100],"introducing":[101],"this":[102],"technique":[103],"folding.":[106],"RESULTS:":[107],"We":[108,158],"introduce":[109],"Spark,":[110],"sparsified":[112],"predicting":[115],"pseudoknotted":[116,228],"Spark":[119,163,175,196,214,232,248],"predicts":[120],"exactly":[121],"same":[123],"minimum-energy":[124],"as":[126,167],"its":[127],"predecessor":[128],"accurate":[132,225],"HotKnots":[133],"2.0":[134],"model":[136],"pseudoknots.":[138],"While":[139],"maintains":[141],"exact":[142],"minimization":[144],"theoretical":[146],"complexity,":[147],"it":[148],"strongly":[149],"improves":[150],"time":[152,180],"space":[154],"consumption":[155],"over":[156],"HFold.":[157,206],"benchmarked":[159],"performance":[161],"against":[164],"and,":[166],"pseudoknot-free":[169],"baseline,":[170],"RNAfold.":[171,190],"Compared":[172],"HFold,":[174],"substantially":[176],"reduces":[177],"both":[178],"run":[179,186],"memory":[182,200],"usage,":[183],"while":[184],"achieving":[185],"times":[187],"close":[188],"Across":[191],"all":[192],"tested":[193],"sequence":[194],"lengths,":[195],"used":[197],"least":[199],"consistently":[202],"ran":[203],"faster":[204],"than":[205],"CONCLUSION:":[207],"Combining":[208],"results":[215,263],"an":[217],"remarkably":[218],"memory-efficient":[221],"tool":[222],"Consequently,":[231],"practically":[233],"enables":[234],"large":[238],"scale":[239],"even":[241],"very":[243],"long":[244],"sequences.":[246],"AVAILABILITY:":[247],"software":[249,261],"is":[250],"available":[251],"on":[252,265],"Github":[253],"(https://github.com/TheCOBRALab/Spark),":[254],"permanent":[257],"archive":[258],"deposited":[264],"Zenodo":[266],"(https://doi.org/10.5281/zenodo.19073315).":[267]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-23T00:00:00"}
