{"id":"https://openalex.org/W7123359432","doi":"https://doi.org/10.1145/3770854.3780178","title":"Improving Enzyme Prediction with Chemical Reaction Equations by Hypergraph-Enhanced Knowledge Graph Embeddings","display_name":"Improving Enzyme Prediction with Chemical Reaction Equations by Hypergraph-Enhanced Knowledge Graph Embeddings","publication_year":2026,"publication_date":"2026-01-08","ids":{"openalex":"https://openalex.org/W7123359432","doi":"https://doi.org/10.1145/3770854.3780178"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2601.05330","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2601.05330","pdf_url":"https://arxiv.org/pdf/2601.05330","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"article","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2601.05330","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080777080","display_name":"Tengwei Song","orcid":"https://orcid.org/0000-0001-5646-7724"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Song, Tengwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122856520","display_name":"Long Yin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Long","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122865589","display_name":"Zhen Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Zhen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5122890850","display_name":"Zhiqiang Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Zhiqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5080777080"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07650971,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.4016999900341034,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.4016999900341034,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.18129999935626984,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.10700000077486038,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hypergraph","display_name":"Hypergraph","score":0.7433000206947327},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7174000144004822},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6251999735832214},{"id":"https://openalex.org/keywords/knowledge-graph","display_name":"Knowledge graph","score":0.5788000226020813},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5371000170707703},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.49900001287460327},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.43309998512268066}],"concepts":[{"id":"https://openalex.org/C2781221856","wikidata":"https://www.wikidata.org/wiki/Q840247","display_name":"Hypergraph","level":2,"score":0.7433000206947327},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7174000144004822},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6251999735832214},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.5788000226020813},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5407999753952026},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5371000170707703},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.49900001287460327},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4542999863624573},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.43309998512268066},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.384799987077713},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3562999963760376},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.31349998712539673},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.2971000075340271},{"id":"https://openalex.org/C177801218","wikidata":"https://www.wikidata.org/wiki/Q36534","display_name":"Chemical reaction","level":2,"score":0.28940001130104065},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.28929999470710754},{"id":"https://openalex.org/C55037315","wikidata":"https://www.wikidata.org/wiki/Q5421151","display_name":"Experimental data","level":2,"score":0.2782999873161316},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.26910001039505005},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C88230418","wikidata":"https://www.wikidata.org/wiki/Q131476","display_name":"Graph theory","level":2,"score":0.26589998602867126},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.26260000467300415}],"mesh":[],"locations_count":1,"locations":[{"id":"pmh:oai:arXiv.org:2601.05330","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2601.05330","pdf_url":"https://arxiv.org/pdf/2601.05330","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2601.05330","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2601.05330","pdf_url":"https://arxiv.org/pdf/2601.05330","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.6072787642478943,"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Predicting":[0],"enzyme-substrate":[1,22,151,208],"interactions":[2,96,209],"has":[3],"long":[4],"been":[5],"a":[6,134,178,182,198,222,228],"fundamental":[7],"problem":[8],"in":[9,157,232,240],"biochemistry":[10],"and":[11,42,48,90,102,195,215,237],"metabolic":[12],"engineering.":[13],"While":[14],"existing":[15],"methods":[16],"could":[17],"leverage":[18],"databases":[19,33],"of":[20,45,55,63,97,129,143,188,207,250],"expert-curated":[21],"pairs":[23,152],"for":[24,153,171],"models":[25,67,115],"to":[26,51,68,70,78,148,159,185,203,227,244],"learn":[27,186],"from":[28,83],"known":[29],"pair":[30],"interactions,":[31],"the":[32,61,105,189,205,212,248],"are":[34,39],"often":[35],"sparse,":[36],"i.e.,":[37,174],"there":[38],"only":[40],"limited":[41],"incomplete":[43],"examples":[44],"such":[46,137],"pairs,":[47],"also":[49],"labor-intensive":[50],"maintain.":[52],"This":[53],"lack":[54],"sufficient":[56],"training":[57],"data":[58,111],"significantly":[59],"hinders":[60],"ability":[62],"traditional":[64,114,245],"enzyme":[65,172,234],"prediction":[66,242],"generalize":[69],"unseen":[71],"interactions.":[72],"In":[73],"this":[74],"work,":[75],"we":[76,122,139,165],"try":[77],"exploit":[79],"chemical":[80,124,216],"reaction":[81,125,217],"equations":[82,126],"domain-specific":[84],"databases,":[85],"given":[86],"their":[87],"easier":[88],"accessibility":[89],"denser,":[91],"more":[92],"abundant":[93],"data.":[94],"However,":[95],"multiple":[98,193],"compounds,":[99,164],"e.g.,":[100],"educts":[101,194],"products,":[103],"with":[104,181,210,225],"same":[106],"enzymes":[107],"create":[108],"complex":[109],"relational":[110],"patterns":[112],"that":[113,138,191],"cannot":[116],"easily":[117],"capture.":[118],"To":[119],"tackle":[120],"that,":[121],"represent":[123],"as":[127],"triples":[128],"(educt,":[130],"enzyme,":[131],"product)":[132],"within":[133],"knowledge":[135,144],"graph,":[136],"can":[140],"take":[141],"advantage":[142],"graph":[145,154],"embedding":[146],"(KGE)":[147],"infer":[149],"missing":[150],"completion.":[155],"Particularly,":[156],"order":[158],"capture":[160],"intricate":[161],"relationships":[162],"among":[163],"propose":[166],"our":[167,251],"knowledge-enhanced":[168],"hypergraph":[169,179],"model":[170,184,214],"prediction,":[173],"Hyper-Enz,":[175],"which":[176],"integrates":[177],"transformer":[180],"KGE":[183],"representations":[187],"hyper-edges":[190],"involve":[192],"products.":[196],"Also,":[197],"multi-expert":[199],"paradigm":[200],"is":[201],"introduced":[202],"guide":[204],"learning":[206],"both":[211],"proposed":[213],"equations.":[218],"Experimental":[219],"results":[220],"show":[221],"significant":[223],"improvement,":[224],"up":[226],"88%":[229],"relative":[230],"improvement":[231,239],"average":[233],"retrieval":[235],"accuracy":[236],"30%":[238],"pair-level":[241],"compared":[243],"models,":[246],"demonstrating":[247],"effectiveness":[249],"approach.":[252]},"counts_by_year":[],"updated_date":"2026-04-28T14:05:53.105641","created_date":"2026-01-14T00:00:00"}
