{"id":"https://openalex.org/W3045699401","doi":"https://doi.org/10.1145/3388440.3412482","title":"Structural representations of DNA regulatory substrates can enhance sequence-based algorithms by associating functional sequence variants","display_name":"Structural representations of DNA regulatory substrates can enhance sequence-based algorithms by associating functional sequence variants","publication_year":2020,"publication_date":"2020-09-21","ids":{"openalex":"https://openalex.org/W3045699401","doi":"https://doi.org/10.1145/3388440.3412482","mag":"3045699401"},"language":"en","primary_location":{"id":"doi:10.1145/3388440.3412482","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3388440.3412482","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2007.14922","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Jan Zrimec","orcid":null},"institutions":[{"id":"https://openalex.org/I66862912","display_name":"Chalmers University of Technology","ror":"https://ror.org/040wg7k59","country_code":"SE","type":"education","lineage":["https://openalex.org/I66862912"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Jan Zrimec","raw_affiliation_strings":["Chalmers University of Technology, Gothenburg, Sweden"],"affiliations":[{"raw_affiliation_string":"Chalmers University of Technology, Gothenburg, Sweden","institution_ids":["https://openalex.org/I66862912"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I66862912"],"apc_list":null,"apc_paid":null,"fwci":0.1672,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.50202395,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.7961000204086304},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.7093999981880188},{"id":"https://openalex.org/keywords/dna","display_name":"DNA","score":0.6967999935150146},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5630999803543091},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.5533000230789185},{"id":"https://openalex.org/keywords/nucleic-acid-sequence","display_name":"Nucleic acid sequence","score":0.5408999919891357},{"id":"https://openalex.org/keywords/dna-sequencing","display_name":"DNA sequencing","score":0.5235999822616577},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4964999854564667},{"id":"https://openalex.org/keywords/nucleotide","display_name":"Nucleotide","score":0.4684999883174896},{"id":"https://openalex.org/keywords/sequencing-by-hybridization","display_name":"Sequencing by hybridization","score":0.4643000066280365}],"concepts":[{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.7961000204086304},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.7093999981880188},{"id":"https://openalex.org/C552990157","wikidata":"https://www.wikidata.org/wiki/Q7430","display_name":"DNA","level":2,"score":0.6967999935150146},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.6674000024795532},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5630999803543091},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.5533000230789185},{"id":"https://openalex.org/C84148353","wikidata":"https://www.wikidata.org/wiki/Q863908","display_name":"Nucleic acid sequence","level":3,"score":0.5408999919891357},{"id":"https://openalex.org/C51679486","wikidata":"https://www.wikidata.org/wiki/Q380546","display_name":"DNA sequencing","level":3,"score":0.5235999822616577},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4964999854564667},{"id":"https://openalex.org/C512185932","wikidata":"https://www.wikidata.org/wiki/Q28745","display_name":"Nucleotide","level":3,"score":0.4684999883174896},{"id":"https://openalex.org/C51064596","wikidata":"https://www.wikidata.org/wiki/Q7452482","display_name":"Sequencing by hybridization","level":5,"score":0.4643000066280365},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.4462999999523163},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.44429999589920044},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.4287000000476837},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4253999888896942},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4047999978065491},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.39809998869895935},{"id":"https://openalex.org/C21592294","wikidata":"https://www.wikidata.org/wiki/Q3238407","display_name":"Regulatory sequence","level":4,"score":0.3718000054359436},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.36739999055862427},{"id":"https://openalex.org/C191961535","wikidata":"https://www.wikidata.org/wiki/Q2360205","display_name":"A-DNA","level":3,"score":0.36149999499320984},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.32919999957084656},{"id":"https://openalex.org/C151020129","wikidata":"https://www.wikidata.org/wiki/Q7625067","display_name":"Structural variation","level":4,"score":0.31299999356269836},{"id":"https://openalex.org/C61053724","wikidata":"https://www.wikidata.org/wiki/Q1154615","display_name":"Sequence analysis","level":3,"score":0.3052999973297119},{"id":"https://openalex.org/C501734568","wikidata":"https://www.wikidata.org/wiki/Q42918","display_name":"Mutation","level":3,"score":0.28790000081062317},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.28769999742507935},{"id":"https://openalex.org/C165864922","wikidata":"https://www.wikidata.org/wiki/Q411391","display_name":"Regulation of gene expression","level":3,"score":0.2854999899864197},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C5527404","wikidata":"https://www.wikidata.org/wiki/Q2357310","display_name":"Structural gene","level":4,"score":0.26989999413490295},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.2687999904155731},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.2687000036239624},{"id":"https://openalex.org/C107824862","wikidata":"https://www.wikidata.org/wiki/Q616005","display_name":"Binding site","level":2,"score":0.2667999863624573},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.26440000534057617},{"id":"https://openalex.org/C3017666073","wikidata":"https://www.wikidata.org/wiki/Q1764062","display_name":"Base sequence","level":3,"score":0.2603999972343445},{"id":"https://openalex.org/C70636015","wikidata":"https://www.wikidata.org/wiki/Q4300350","display_name":"Molecular biophysics","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C54985914","wikidata":"https://www.wikidata.org/wiki/Q1295754","display_name":"Consensus sequence","level":4,"score":0.25450000166893005}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3388440.3412482","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3388440.3412482","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2007.14922","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2007.14922","pdf_url":"https://arxiv.org/pdf/2007.14922","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:research.chalmers.se:521506","is_oa":false,"landing_page_url":"https://research.chalmers.se/en/publication/521506","pdf_url":null,"source":{"id":"https://openalex.org/S4306402469","display_name":"Chalmers Research (Chalmers University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66862912","host_organization_name":"Chalmers University of Technology","host_organization_lineage":["https://openalex.org/I66862912"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2007.14922","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2007.14922","pdf_url":"https://arxiv.org/pdf/2007.14922","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6139265688","display_name":null,"funder_award_id":"Z2-7257","funder_id":"https://openalex.org/F4320322554","funder_display_name":"Javna Agencija za Raziskovalno Dejavnost RS"}],"funders":[{"id":"https://openalex.org/F4320322554","display_name":"Javna Agencija za Raziskovalno Dejavnost RS","ror":"https://ror.org/059bp8k51"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1952865633","https://openalex.org/W1971811844","https://openalex.org/W1988580441","https://openalex.org/W1996852546","https://openalex.org/W2012015946","https://openalex.org/W2012627860","https://openalex.org/W2032268510","https://openalex.org/W2067924339","https://openalex.org/W2122429294","https://openalex.org/W2184652140","https://openalex.org/W2329440962","https://openalex.org/W2758955131","https://openalex.org/W2807706038","https://openalex.org/W4242702784"],"related_works":[],"abstract_inverted_index":{"The":[0,91],"nucleotide":[1,89,131,173],"sequence":[2,99,174],"representation":[3],"of":[4,73,83,113,125,140,154,167],"DNA":[5,43,56,98,126],"can":[6,53,77],"be":[7,78,185],"inadequate":[8],"for":[9],"resolving":[10],"protein-DNA":[11,74],"binding":[12,57],"sites":[13,58],"and":[14,24,45,76,145],"regulatory":[15,61],"substrates,":[16],"such":[17,188],"as":[18,105],"those":[19],"involved":[20],"in":[21,86],"gene":[22,26],"expression":[23],"horizontal":[25],"transfer.":[27],"Considering":[28],"that":[29,52,65,117,179],"sequence-like":[30],"representations":[31,51,95,158],"are":[32],"algorithmically":[33],"very":[34],"useful,":[35],"here":[36],"we":[37,143],"fused":[38],"over":[39],"60":[40],"currently":[41],"available":[42],"physicochemical":[44],"conformational":[46],"variables":[47],"into":[48],"compact":[49],"structural":[50,68,94,119,157],"encode":[54],"single":[55,88],"to":[59,80,103,111,159,164,172],"whole":[60],"regions.":[62],"We":[63,115],"find":[64],"the":[66,81,152,156,165],"main":[67],"components":[69],"reflect":[70],"key":[71],"properties":[72],"interactions":[75],"condensed":[79],"amount":[82],"information":[84],"found":[85],"a":[87,118,138,147],"position.":[90],"most":[92,168],"accurate":[93],"compress":[96],"functional":[97],"variants":[100],"by":[101],"30%":[102],"50%,":[104],"each":[106],"instance":[107],"encodes":[108],"from":[109],"tens":[110],"thousands":[112],"sequences.":[114],"show":[116],"distance":[120],"function":[121],"discriminates":[122],"among":[123],"groups":[124],"substrates":[127],"more":[128],"accurately":[129],"than":[130],"sequence-based":[132,161],"metrics.":[133],"As":[134],"this":[135],"opens":[136],"up":[137],"variety":[139],"implementation":[141],"possibilities,":[142],"develop":[144],"test":[146],"distance-based":[148],"alignment":[149],"algorithm,":[150],"demonstrating":[151],"potential":[153],"using":[155],"enhance":[160],"algorithms.":[162],"Due":[163],"bias":[166],"current":[169],"bioinformatic":[170],"methods":[171],"representations,":[175],"it":[176],"is":[177],"possible":[178],"considerable":[180],"performance":[181],"increases":[182],"might":[183],"still":[184],"achievable":[186],"with":[187],"solutions.":[189]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2020-08-03T00:00:00"}
