{"id":"https://openalex.org/W7161717623","doi":"https://doi.org/10.48550/arxiv.2605.17254","title":"CatalyticMLLM: A Graph-Text Multimodal Large Language Model for Catalytic Materials","display_name":"CatalyticMLLM: A Graph-Text Multimodal Large Language Model for Catalytic Materials","publication_year":2026,"publication_date":"2026-05-17","ids":{"openalex":"https://openalex.org/W7161717623","doi":"https://doi.org/10.48550/arxiv.2605.17254"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.17254","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17254","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.17254","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136455235","display_name":"Yanjie Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yanjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Xu, Jian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhang, Xu-Yao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xu-Yao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Xiang, Shiming","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiang, Shiming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Ran, Nian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ran, Nian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Li, Weijun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Weijun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Liu, Cheng-Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Cheng-Lin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10030","display_name":"Electrocatalysts for Energy Conversion","score":0.0020000000949949026,"subfield":{"id":"https://openalex.org/subfields/2105","display_name":"Renewable Energy, Sustainability and the Environment"},"field":{"id":"https://openalex.org/fields/21","display_name":"Energy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.0017000000225380063,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.7347000241279602},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6581000089645386},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.6128000020980835},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5504000186920166},{"id":"https://openalex.org/keywords/inverse","display_name":"Inverse","score":0.519599974155426},{"id":"https://openalex.org/keywords/unified-model","display_name":"Unified Model","score":0.4925000071525574},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.46700000762939453}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.782800018787384},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.7347000241279602},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6581000089645386},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.6128000020980835},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5504000186920166},{"id":"https://openalex.org/C207467116","wikidata":"https://www.wikidata.org/wiki/Q4385666","display_name":"Inverse","level":2,"score":0.519599974155426},{"id":"https://openalex.org/C45493050","wikidata":"https://www.wikidata.org/wiki/Q7884934","display_name":"Unified Model","level":2,"score":0.4925000071525574},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.46700000762939453},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.45579999685287476},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.44290000200271606},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42719998955726624},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3587000072002411},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3206999897956848},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.305400013923645},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.295199990272522},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2883000075817108},{"id":"https://openalex.org/C135252773","wikidata":"https://www.wikidata.org/wiki/Q1567213","display_name":"Inverse problem","level":2,"score":0.2808000147342682},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2791999876499176}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.17254","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17254","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.17254","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17254","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Property":[0],"prediction":[1,54,99,122,166,178],"and":[2,51,61,70,100,107,127,133,167,179],"inverse":[3,168],"structural":[4],"design":[5,169],"of":[6,41,58,77,149,174],"catalytic":[7,94,164],"materials":[8],"are":[9],"typically":[10],"modeled":[11],"as":[12],"two":[13],"independent":[14],"tasks:":[15],"the":[16,25,35,39,45,48,52,75,104,172],"former":[17],"predicts":[18],"target":[19,141],"properties":[20],"from":[21],"given":[22],"structures,":[23],"whereas":[24],"latter":[26],"generates":[27],"candidate":[28],"structures":[29,126],"according":[30],"to":[31],"desired":[32],"properties.":[33],"Although":[34],"decoupled":[36,160],"paradigm":[37,158],"facilitates":[38],"implementation":[40],"a":[42,86,145,183],"``generation--evaluation--screening''":[43],"workflow,":[44],"inconsistency":[46],"between":[47],"generative":[49],"model":[50,55,92,106],"property":[53,98,121,177],"in":[56],"terms":[57],"representation":[59,109],"spaces":[60],"training":[62],"objectives":[63],"can":[64,116],"readily":[65],"introduce":[66],"data":[67],"distribution":[68],"shifts":[69],"evaluator":[71],"bias,":[72],"thereby":[73,143],"limiting":[74],"stability":[76],"closed-loop":[78,146],"optimization.":[79],"In":[80],"this":[81,112,156],"work,":[82],"we":[83],"propose":[84],"CatalyticMLLM,":[85],"unified":[87,113,157],"graph--text":[88],"multimodal":[89,185],"large":[90],"language":[91],"for":[93],"materials,":[95],"which":[96],"integrates":[97],"\\textbf{inverse":[101],"design}":[102],"within":[103,182],"same":[105],"shared":[108],"space.":[110],"Under":[111],"framework,":[114],"CatalyticMLLM":[115],"not":[117],"only":[118],"perform":[119],"reliable":[120],"by":[123],"leveraging":[124],"three-dimensional":[125],"textual":[128],"information,":[129],"but":[130],"also":[131],"generate":[132],"screen":[134],"physically":[135],"feasible":[136],"CIF":[137],"candidates":[138],"conditioned":[139],"on":[140,162],"properties,":[142],"forming":[144],"optimization":[147],"workflow":[148],"``inverse":[150],"design--prediction--screening--redesign.''":[151],"Experimental":[152],"results":[153],"demonstrate":[154],"that":[155],"outperforms":[159],"baselines":[161],"both":[163],"relaxed-energy":[165],"tasks,":[170],"validating":[171],"effectiveness":[173],"jointly":[175],"modeling":[176],"structure":[180],"generation":[181],"single":[184],"model.":[186]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-20T00:00:00"}
