{"id":"https://openalex.org/W7131248149","doi":"https://doi.org/10.48550/arxiv.2602.18479","title":"AgentCAT: An LLM Agent for Extracting and Analyzing Catalytic Reaction Data from Chemical Engineering Literature","display_name":"AgentCAT: An LLM Agent for Extracting and Analyzing Catalytic Reaction Data from Chemical Engineering Literature","publication_year":2026,"publication_date":"2026-02-10","ids":{"openalex":"https://openalex.org/W7131248149","doi":"https://doi.org/10.48550/arxiv.2602.18479"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.18479","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126662127","display_name":"Wei Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yang, Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126742303","display_name":"Zihao Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126659774","display_name":"Tao Tan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tan, Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126678244","display_name":"Xiao Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Xiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126745076","display_name":"Hong Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Hong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126731952","display_name":"Lulu Li Xin Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Lulu Li Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053948087","display_name":"Jianyu Han","orcid":"https://orcid.org/0000-0001-5248-376X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Jianyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126708731","display_name":"Defu Lian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lian, Defu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5027826060","display_name":"Mao Ye","orcid":"https://orcid.org/0000-0002-9584-9140"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Mao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5126662127"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.6942999958992004,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.6942999958992004,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12112","display_name":"Ammonia Synthesis and Nitrogen Reduction","score":0.018799999728798866,"subfield":{"id":"https://openalex.org/subfields/1503","display_name":"Catalysis"},"field":{"id":"https://openalex.org/fields/15","display_name":"Chemical Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10495","display_name":"Catalysts for Methane Reforming","score":0.009399999864399433,"subfield":{"id":"https://openalex.org/subfields/1503","display_name":"Catalysis"},"field":{"id":"https://openalex.org/fields/15","display_name":"Chemical Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.646399974822998},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.5116000175476074},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.45399999618530273},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.4122999906539917},{"id":"https://openalex.org/keywords/knowledge-extraction","display_name":"Knowledge extraction","score":0.3928999900817871},{"id":"https://openalex.org/keywords/dependency-graph","display_name":"Dependency graph","score":0.37529999017715454},{"id":"https://openalex.org/keywords/data-visualization","display_name":"Data visualization","score":0.3714999854564667},{"id":"https://openalex.org/keywords/fluid-catalytic-cracking","display_name":"Fluid catalytic cracking","score":0.3463999927043915},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.33970001339912415}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7337999939918518},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.646399974822998},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.5116000175476074},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.45399999618530273},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.4122999906539917},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.3928999900817871},{"id":"https://openalex.org/C16311509","wikidata":"https://www.wikidata.org/wiki/Q4148050","display_name":"Dependency graph","level":3,"score":0.37529999017715454},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.3714999854564667},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.352400004863739},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3513999879360199},{"id":"https://openalex.org/C31052017","wikidata":"https://www.wikidata.org/wiki/Q900812","display_name":"Fluid catalytic cracking","level":3,"score":0.3463999927043915},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34540000557899475},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.33970001339912415},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.3368000090122223},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.33169999718666077},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.32749998569488525},{"id":"https://openalex.org/C198134878","wikidata":"https://www.wikidata.org/wiki/Q2667887","display_name":"Chemical reaction engineering","level":3,"score":0.3151000142097473},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.302700012922287},{"id":"https://openalex.org/C76363472","wikidata":"https://www.wikidata.org/wiki/Q1437394","display_name":"Formal concept analysis","level":2,"score":0.29910001158714294},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.29260000586509705},{"id":"https://openalex.org/C148230440","wikidata":"https://www.wikidata.org/wiki/Q1172264","display_name":"Datalog","level":2,"score":0.2854999899864197},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2849000096321106},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.28220000863075256},{"id":"https://openalex.org/C174998907","wikidata":"https://www.wikidata.org/wiki/Q357662","display_name":"Work in process","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.26260000467300415},{"id":"https://openalex.org/C84685590","wikidata":"https://www.wikidata.org/wiki/Q1540472","display_name":"Knowledge engineering","level":2,"score":0.2567000091075897},{"id":"https://openalex.org/C175801342","wikidata":"https://www.wikidata.org/wiki/Q1988917","display_name":"Data analysis","level":2,"score":0.25099998712539673},{"id":"https://openalex.org/C2777466982","wikidata":"https://www.wikidata.org/wiki/Q5227287","display_name":"Data extraction","level":3,"score":0.2506999969482422}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.18479","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.18479","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.18479","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.18479","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0,83,129],"paper":[1],"presents":[2,64],"a":[3,65,164,181,205],"large":[4],"language":[5,25,51],"model":[6],"(LLM)":[7],"agent":[8],"named":[9],"AgentCAT,":[10],"which":[11],"extracts":[12],"and":[13,48,68,94,139,155,196,202,213],"analyzes":[14],"catalytic":[15,73,107,115],"reaction":[16,74,116,122],"data":[17,42,54,75,117,142,174],"from":[18,176],"chemical":[19,45,177,228],"engineering":[20,46,178,229],"papers,":[21],"%and":[22],"supports":[23,210],"natural":[24,50],"based":[26,52],"interactive":[27,53],"analysis":[28,55,70],"of":[29,71,141,160,234],"the":[30,40,60,72,87,105,137,216,232],"extracted":[31],"data.":[32],"AgentCAT":[33,62,151],"serves":[34],"as":[35,144,146],"an":[36,79,223],"alternative":[37],"to":[38,59,101,110,120,135],"overcome":[39],"long-standing":[41],"bottleneck":[43],"in":[44,78,95,114],"field,":[47],"its":[49],"functionality":[56],"is":[57],"friendly":[58],"community.":[61],"also":[63],"formal":[66],"abstraction":[67,84],"challenge":[69,154],"extraction":[76,166,175],"task":[77],"artificial":[80,88],"intelligence-friendly":[81],"manner.":[82],"would":[85,97],"help":[86],"intelligence":[89],"community":[90],"understand":[91],"this":[92,153],"problem":[93],"turn":[96],"attract":[98],"more":[99],"attention":[100],"address":[102],"it.":[103],"Technically,":[104],"complex":[106],"process":[108,200],"leads":[109],"complicated":[111],"dependency":[112,130],"structure":[113,131],"with":[118,168,194],"respect":[119],"elementary":[121],"steps,":[123],"molecular":[124],"behaviors,":[125],"measurement":[126],"evidence,":[127,195],"etc.":[128],"makes":[132,157],"it":[133,156],"challenging":[134],"guarantee":[136],"correctness":[138],"completeness":[140],"extraction,":[143],"well":[145],"representing":[147],"them":[148],"for":[149,219],"analysis.":[150],"addresses":[152],"four":[158],"folds":[159],"technical":[161],"contributions:":[162],"(1)":[163],"schema-governed":[165],"pipeline":[167],"progressive":[169],"schema":[170],"evolution,":[171],"enabling":[172],"robust":[173],"papers;":[179],"(2)":[180],"dependency-aware":[182],"reaction-network":[183],"knowledge":[184],"graph":[185,218],"that":[186,209],"links":[187],"catalysts/active":[188],"sites,":[189],"synthesis-derived":[190],"descriptors,":[191],"mechanistic":[192],"claims":[193],"macroscopic":[197],"outcomes,":[198],"preserving":[199],"coupling":[201],"traceability;":[203],"(3)":[204],"general":[206],"querying":[207],"module":[208],"natural-language":[211],"exploration":[212],"visualization":[214],"over":[215],"constructed":[217],"cross-paper":[220],"analysis;":[221],"(4)":[222],"evaluation":[224],"on":[225],"$\\sim$800":[226],"peer-reviewed":[227],"publications":[230],"demonstrating":[231],"effectiveness":[233],"AgentCAT.":[235]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-25T00:00:00"}
