{"id":"https://openalex.org/W6948203586","doi":"https://doi.org/10.48550/arxiv.2507.08109","title":"Audit, Alignment, and Optimization of LM-Powered Subroutines with Application to Public Comment Processing","display_name":"Audit, Alignment, and Optimization of LM-Powered Subroutines with Application to Public Comment Processing","publication_year":2025,"publication_date":"2025-07-10","ids":{"openalex":"https://openalex.org/W6948203586","doi":"https://doi.org/10.48550/arxiv.2507.08109"},"language":"en","primary_location":{"id":"doi:10.48550/arxiv.2507.08109","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.08109","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2507.08109","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Raab, Reilly","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Raab, Reilly","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Parker, Mike","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parker, Mike","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Nally, Dan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nally, Dan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Montgomery, Sadie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Montgomery, Sadie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Bernat, Anastasia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bernat, Anastasia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Munikoti, Sai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Munikoti, Sai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Horawalavithana, Sameera","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Horawalavithana, Sameera","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.15160000324249268,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.15160000324249268,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12640","display_name":"Environmental DNA in Biodiversity Studies","score":0.07109999656677246,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11879","display_name":"Protist diversity and phylogeny","score":0.06589999794960022,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/subroutine","display_name":"Subroutine","score":0.8159999847412109},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.647599995136261},{"id":"https://openalex.org/keywords/audit","display_name":"Audit","score":0.5975000262260437},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5958999991416931},{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.588100016117096},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5356000065803528},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.39070001244544983},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.3312999904155731}],"concepts":[{"id":"https://openalex.org/C96147967","wikidata":"https://www.wikidata.org/wiki/Q190686","display_name":"Subroutine","level":2,"score":0.8159999847412109},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7670999765396118},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.647599995136261},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.5975000262260437},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5958999991416931},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.588100016117096},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5356000065803528},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.44830000400543213},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.397599995136261},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.39070001244544983},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3880999982357025},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.3312999904155731},{"id":"https://openalex.org/C29122968","wikidata":"https://www.wikidata.org/wiki/Q1414816","display_name":"Incentive","level":2,"score":0.3100999891757965},{"id":"https://openalex.org/C59577422","wikidata":"https://www.wikidata.org/wiki/Q10265143","display_name":"False accusation","level":2,"score":0.30059999227523804},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C71745522","wikidata":"https://www.wikidata.org/wiki/Q2476929","display_name":"Confidentiality","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.2732999920845032},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C2780626000","wikidata":"https://www.wikidata.org/wiki/Q5936775","display_name":"Human-in-the-loop","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26739999651908875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2648000121116638},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.25429999828338623},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.25279998779296875}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2507.08109","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.08109","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2507.08109","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.08109","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.8127201199531555}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"advent":[1],"of":[2,97,161,192,230],"language":[3],"models":[4],"(LMs)":[5],"has":[6],"the":[7,95,159,168,207,228],"potential":[8],"to":[9,17,49,93,120,131,180,198,218],"dramatically":[10],"accelerate":[11],"tasks":[12],"that":[13,85,185],"may":[14,141],"be":[15,142],"cast":[16],"text-processing;":[18],"however,":[19],"real-world":[20,146],"adoption":[21,134],"is":[22,91],"hindered":[23],"by":[24,167,209,224],"concerns":[25],"regarding":[26],"safety,":[27],"explainability,":[28],"and":[29,45,114,118,135,152,188],"bias.":[30],"How":[31],"can":[32],"we":[33,63,155,176],"responsibly":[34],"leverage":[35],"LMs":[36],"in":[37,150,158,196],"a":[38,65,129,190,199],"transparent,":[39],"auditable":[40],"manner":[41],"--":[42,83],"minimizing":[43],"risk":[44],"allowing":[46],"human":[47,89,216,225],"experts":[48,90],"focus":[50],"on":[51,122],"informed":[52],"decision-making":[53],"rather":[54],"than":[55],"data-processing":[56],"or":[57],"prompt":[58],"engineering?":[59],"In":[60,104],"this":[61,126,139,178],"work,":[62],"propose":[64],"framework":[66,127,140,179],"for":[67,77],"declaring":[68],"statically":[69],"typed,":[70],"LM-powered":[71],"subroutines":[72],"(i.e.,":[73,101,110],"callable,":[74],"function-like":[75],"procedures)":[76],"use":[78,177],"within":[79],"conventional":[80],"asynchronous":[81],"code":[82],"such":[84],"sparse":[86],"feedback":[87],"from":[88],"used":[92],"improve":[94],"performance":[96],"each":[98],"subroutine":[99],"online":[100],"during":[102,227],"use).":[103],"our":[105],"implementation,":[106],"all":[107],"LM-produced":[108],"artifacts":[109],"prompts,":[111],"inputs,":[112],"outputs,":[113],"data-dependencies)":[115],"are":[116],"recorded":[117],"exposed":[119],"audit":[121],"demand.":[123],"We":[124,204],"package":[125],"as":[128,165,222],"library":[130],"support":[132],"its":[133,211],"continued":[136],"development.":[137],"While":[138],"applicable":[143],"across":[144],"several":[145],"decision":[147],"workflows":[148],"(e.g.,":[149],"healthcare":[151],"legal":[153],"fields),":[154],"evaluate":[156,206],"it":[157],"context":[160],"public":[162,193],"comment":[163],"processing":[164],"mandated":[166],"1969":[169],"National":[170],"Environmental":[171],"Protection":[172],"Act":[173],"(NEPA):":[174],"Specifically,":[175],"develop":[181],"\"CommentNEPA,\"":[182],"an":[183],"application":[184,208],"compiles,":[186],"organizes,":[187],"summarizes":[189],"corpus":[191],"commentary":[194],"submitted":[195],"response":[197],"project":[200],"requiring":[201],"environmental":[202,232],"review.":[203],"quantitatively":[205],"comparing":[210],"outputs":[212],"(when":[213],"operating":[214],"without":[215],"feedback)":[217],"historical":[219],"``ground-truth''":[220],"data":[221],"labelled":[223],"annotators":[226],"preparation":[229],"official":[231],"impact":[233],"statements.":[234]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
