{"id":"https://openalex.org/W2052074791","doi":"https://doi.org/10.1109/bibe.2007.4375733","title":"Toward The Recognition Code Of Protein-DNA Recognition","display_name":"Toward The Recognition Code Of Protein-DNA Recognition","publication_year":2007,"publication_date":"2007-10-01","ids":{"openalex":"https://openalex.org/W2052074791","doi":"https://doi.org/10.1109/bibe.2007.4375733","mag":"2052074791"},"language":"en","primary_location":{"id":"doi:10.1109/bibe.2007.4375733","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibe.2007.4375733","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 IEEE 7th International Symposium on BioInformatics and BioEngineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020469612","display_name":"Juan Shan","orcid":"https://orcid.org/0000-0002-2718-3164"},"institutions":[{"id":"https://openalex.org/I121980950","display_name":"Utah State University","ror":"https://ror.org/00h6set76","country_code":"US","type":"education","lineage":["https://openalex.org/I121980950"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Juan Shan","raw_affiliation_strings":["Department of Computer Science, Utah State University, Logan, UT, USA","Utah State Univ, Logan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Utah State University, Logan, UT, USA","institution_ids":["https://openalex.org/I121980950"]},{"raw_affiliation_string":"Utah State Univ, Logan","institution_ids":["https://openalex.org/I121980950"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101664515","display_name":"Yuxuan Wang","orcid":"https://orcid.org/0009-0005-3508-3736"},"institutions":[{"id":"https://openalex.org/I121980950","display_name":"Utah State University","ror":"https://ror.org/00h6set76","country_code":"US","type":"education","lineage":["https://openalex.org/I121980950"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuxuan Wang","raw_affiliation_strings":["Department of Computer Science, Utah State University, Logan, UT, USA","Utah State Univ, Logan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Utah State University, Logan, UT, USA","institution_ids":["https://openalex.org/I121980950"]},{"raw_affiliation_string":"Utah State Univ, Logan","institution_ids":["https://openalex.org/I121980950"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100871727","display_name":"Changhui Yan","orcid":"https://orcid.org/0000-0003-3048-8628"},"institutions":[{"id":"https://openalex.org/I121980950","display_name":"Utah State University","ror":"https://ror.org/00h6set76","country_code":"US","type":"education","lineage":["https://openalex.org/I121980950"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Changhui Yan","raw_affiliation_strings":["Department of Computer Science, Utah State University, Logan, UT, USA","Utah State Univ, Logan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Utah State University, Logan, UT, USA","institution_ids":["https://openalex.org/I121980950"]},{"raw_affiliation_string":"Utah State Univ, Logan","institution_ids":["https://openalex.org/I121980950"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5020469612"],"corresponding_institution_ids":["https://openalex.org/I121980950"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.09950821,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":95},"biblio":{"volume":"7","issue":null,"first_page":"1290","last_page":"1293"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/amino-acid","display_name":"Amino acid","score":0.5927115082740784},{"id":"https://openalex.org/keywords/purine-metabolism","display_name":"Purine metabolism","score":0.5780165195465088},{"id":"https://openalex.org/keywords/dna","display_name":"DNA","score":0.5535005927085876},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5501287579536438},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5312083959579468},{"id":"https://openalex.org/keywords/genetic-code","display_name":"Genetic code","score":0.48617929220199585},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.46855196356773376},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4463396370410919},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39470577239990234},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3209090232849121},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.29154646396636963},{"id":"https://openalex.org/keywords/biochemistry","display_name":"Biochemistry","score":0.28507137298583984},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.2285677194595337},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.15493643283843994}],"concepts":[{"id":"https://openalex.org/C515207424","wikidata":"https://www.wikidata.org/wiki/Q8066","display_name":"Amino acid","level":2,"score":0.5927115082740784},{"id":"https://openalex.org/C169586020","wikidata":"https://www.wikidata.org/wiki/Q3780159","display_name":"Purine metabolism","level":3,"score":0.5780165195465088},{"id":"https://openalex.org/C552990157","wikidata":"https://www.wikidata.org/wiki/Q7430","display_name":"DNA","level":2,"score":0.5535005927085876},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5501287579536438},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5312083959579468},{"id":"https://openalex.org/C10853874","wikidata":"https://www.wikidata.org/wiki/Q180618","display_name":"Genetic code","level":3,"score":0.48617929220199585},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.46855196356773376},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4463396370410919},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39470577239990234},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3209090232849121},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.29154646396636963},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.28507137298583984},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.2285677194595337},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.15493643283843994},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C181199279","wikidata":"https://www.wikidata.org/wiki/Q8047","display_name":"Enzyme","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibe.2007.4375733","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibe.2007.4375733","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 IEEE 7th International Symposium on BioInformatics and BioEngineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1491553314","https://openalex.org/W1979558004","https://openalex.org/W1986586522","https://openalex.org/W1993006141","https://openalex.org/W1999755087","https://openalex.org/W2017727500","https://openalex.org/W2032975481","https://openalex.org/W2048241051","https://openalex.org/W2057664120","https://openalex.org/W2061307445","https://openalex.org/W2063643370","https://openalex.org/W2067007345","https://openalex.org/W2087887622","https://openalex.org/W2102154371","https://openalex.org/W2107432340","https://openalex.org/W2110562802","https://openalex.org/W2112574017","https://openalex.org/W2115694019","https://openalex.org/W2130479394","https://openalex.org/W2137154596","https://openalex.org/W2147236517","https://openalex.org/W2148603752","https://openalex.org/W2154447604","https://openalex.org/W2169837652","https://openalex.org/W4211206335"],"related_works":["https://openalex.org/W97567589","https://openalex.org/W2080601739","https://openalex.org/W3020887404","https://openalex.org/W2102971391","https://openalex.org/W2064088083","https://openalex.org/W1982081746","https://openalex.org/W4401213142","https://openalex.org/W1968879131","https://openalex.org/W2360347211","https://openalex.org/W168348071"],"abstract_inverted_index":{"Discovering":[0],"the":[1,23,35,44,62,89,99,106,129,142,149],"\"recognition":[2,150],"code\"":[3,151],"governing":[4],"protein-DNA":[5,153],"interaction":[6],"has":[7],"been":[8],"an":[9,137],"important":[10],"topic":[11],"for":[12,88],"decades":[13],"in":[14,127],"bioinformatics.":[15],"While":[16],"other":[17],"studies":[18],"have":[19],"focused":[20],"on":[21],"analyzing":[22],"frequency":[24],"of":[25,40,46,64,91,101,131,152],"amino":[26,47,52,102,138],"acid-base":[27,48,103],"contacts,":[28],"this":[29],"study":[30],"here":[31],"attempts":[32],"to":[33,60,86,97],"discover":[34],"structural":[36,75],"and":[37,76,81],"physicochemical":[38,77],"features":[39,78,92,109,144],"proteins":[41,80],"that":[42,54,69,93,136],"determine":[43],"specificity":[45,100],"contacts.":[49,71,104,140],"For":[50],"each":[51],"acid":[53,139],"contacts":[55],"with":[56,124],"DNA,":[57],"we":[58],"attempt":[59],"predict":[61,98],"type":[63,130],"bases":[65],"(purines":[66,133],"or":[67,134],"pyrimidines)":[68,135],"it":[70],"We":[72],"extract":[73],"8":[74],"from":[79],"use":[82],"a":[83,115],"bottom-up":[84],"approach":[85],"search":[87],"combination":[90],"can":[94,120],"be":[95],"used":[96],"In":[105],"end,":[107],"4":[108],"are":[110],"selected.":[111],"Using":[112],"these":[113],"features,":[114],"support":[116],"vector":[117],"machine":[118],"method":[119],"achieve":[121],"67.1%":[122],"accuracy":[123],"0.329":[125],"MCC":[126],"predicting":[128],"base":[132],"Analyzing":[141],"selected":[143],"will":[145],"provide":[146],"insights":[147],"into":[148],"interaction.":[154]},"counts_by_year":[{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
