{"id":"https://openalex.org/W7148781458","doi":"https://doi.org/10.48550/arxiv.2604.01529","title":"A Role-Based LLM Framework for Structured Information Extraction from Healthy Food Policies","display_name":"A Role-Based LLM Framework for Structured Information Extraction from Healthy Food Policies","publication_year":2026,"publication_date":"2026-04-02","ids":{"openalex":"https://openalex.org/W7148781458","doi":"https://doi.org/10.48550/arxiv.2604.01529"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.01529","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01529","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.01529","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132845372","display_name":"Congjing Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Congjing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125119465","display_name":"Ruoxuan Bao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bao, Ruoxuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132885880","display_name":"Jingyu Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jingyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132836642","display_name":"Yoav Ackerman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ackerman, Yoav","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132859732","display_name":"Shuai Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Shuai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5051316148","display_name":"Yanfang Su","orcid":"https://orcid.org/0000-0002-4526-4187"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Yanfang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5132845372"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.10409999638795853,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.10409999638795853,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12057","display_name":"Consumer Attitudes and Food Labeling","score":0.0982000008225441,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.08209999650716782,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.7149999737739563},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.6790000200271606},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5774000287055969},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.36340001225471497},{"id":"https://openalex.org/keywords/food-policy","display_name":"Food policy","score":0.3294000029563904},{"id":"https://openalex.org/keywords/corporate-governance","display_name":"Corporate governance","score":0.3244999945163727}],"concepts":[{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.7149999737739563},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.6790000200271606},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6309000253677368},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5774000287055969},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.4032999873161316},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3978999853134155},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.36340001225471497},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.33070001006126404},{"id":"https://openalex.org/C2779363069","wikidata":"https://www.wikidata.org/wiki/Q5465509","display_name":"Food policy","level":4,"score":0.3294000029563904},{"id":"https://openalex.org/C39389867","wikidata":"https://www.wikidata.org/wiki/Q380767","display_name":"Corporate governance","level":2,"score":0.3244999945163727},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32179999351501465},{"id":"https://openalex.org/C161756209","wikidata":"https://www.wikidata.org/wiki/Q613423","display_name":"Use Case Diagram","level":5,"score":0.31360000371932983},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30640000104904175},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.30160000920295715},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2913999855518341},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2572999894618988},{"id":"https://openalex.org/C180198813","wikidata":"https://www.wikidata.org/wiki/Q121182","display_name":"Information system","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C74893574","wikidata":"https://www.wikidata.org/wiki/Q5465532","display_name":"Food systems","level":4,"score":0.25189998745918274},{"id":"https://openalex.org/C3020707900","wikidata":"https://www.wikidata.org/wiki/Q25099819","display_name":"Healthy food","level":2,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.01529","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01529","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.01529","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01529","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Zero hunger","id":"https://metadata.un.org/sdg/2","score":0.6875651478767395}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Current":[0],"Large":[1],"Language":[2],"Model":[3],"(LLM)":[4],"approaches":[5],"for":[6,67,77,88,161],"information":[7],"extraction":[8],"(IE)":[9],"in":[10,151],"the":[11,32,53,118,126],"healthy":[12,122],"food":[13,85,90,123],"policy":[14,38,57,65],"domain":[15,102],"are":[16],"often":[17],"hindered":[18],"by":[19,59,99],"various":[20],"factors,":[21],"including":[22,104],"misinformation,":[23],"specifically":[24],"hallucinations,":[25],"misclassifications,":[26],"and":[27,35,69,82,110,139,158],"omissions":[28],"that":[29,51],"result":[30],"from":[31,55,125,164],"structural":[33],"diversity":[34],"inconsistency":[36],"of":[37,107],"documents.":[39],"To":[40],"address":[41],"these":[42],"limitations,":[43],"this":[44],"study":[45],"proposes":[46],"a":[47,156],"role-based":[48],"LLM":[49,64,73,84],"framework":[50,94,119,147],"automates":[52],"IE":[54,163],"unstructured":[56],"data":[58],"assigning":[60],"specialized":[61],"roles:":[62],"an":[63,72,83],"analyst":[66],"metadata":[68],"mechanism":[70],"classification,":[71],"legal":[74,80,108],"strategy":[75],"specialist":[76],"identifying":[78],"complex":[79,152],"approaches,":[81],"system":[86,91],"expert":[87,96],"categorizing":[89],"stages.":[92],"This":[93],"mimics":[95],"analysis":[97],"workflows":[98],"incorporating":[100],"structured":[101],"knowledge,":[103],"explicit":[105],"definitions":[106],"mechanisms":[109],"classification":[111],"criteria,":[112],"into":[113],"role-specific":[114],"prompts.":[115],"We":[116],"evaluate":[117],"using":[120,143],"608":[121],"policies":[124],"Healthy":[127],"Food":[128],"Policy":[129],"Project":[130],"(HFPP)":[131],"database,":[132],"comparing":[133],"its":[134],"performance":[135,150],"against":[136],"zero-shot,":[137],"few-shot,":[138],"chain-of-thought":[140],"(CoT)":[141],"baselines":[142],"Llama-3.3-70B.":[144],"Our":[145],"proposed":[146],"demonstrates":[148],"superior":[149],"reasoning":[153],"tasks,":[154],"offering":[155],"reliable":[157],"transparent":[159],"methodology":[160],"automating":[162],"health":[165],"policies.":[166]},"counts_by_year":[],"updated_date":"2026-04-04T06:15:33.020886","created_date":"2026-04-04T00:00:00"}
