{"id":"https://openalex.org/W7160604215","doi":"https://doi.org/10.48550/arxiv.2605.05348","title":"Making AI Drafts Count: A Quality Threshold in Audio Description Workflows","display_name":"Making AI Drafts Count: A Quality Threshold in Audio Description Workflows","publication_year":2026,"publication_date":"2026-05-06","ids":{"openalex":"https://openalex.org/W7160604215","doi":"https://doi.org/10.48550/arxiv.2605.05348"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.05348","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05348","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.05348","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135681051","display_name":"Lana Do","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Do, Lana","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135672482","display_name":"Shasta Ihorn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ihorn, Shasta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135694262","display_name":"Charity M. Pitcher-Cooper","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pitcher-Cooper, Charity M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5118452576","display_name":"Sanjay Mirani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mirani, Sanjay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124886592","display_name":"Gio Jung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jung, Gio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135718322","display_name":"Hyunjoo Shim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shim, Hyunjoo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135680495","display_name":"Zhenzhen Qin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qin, Zhenzhen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135653808","display_name":"Kien T. Nguyen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Kien T.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025213339","display_name":"Vassilis Athitsos","orcid":"https://orcid.org/0000-0002-1281-6168"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Athitsos, Vassilis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5076251624","display_name":"Ilmi Yoon","orcid":"https://orcid.org/0000-0002-2418-5287"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoon, Ilmi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13310","display_name":"Subtitles and Audiovisual Media","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13310","display_name":"Subtitles and Audiovisual Media","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10759","display_name":"Translation Studies and Practices","score":0.00279999990016222,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.002300000051036477,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.7426999807357788},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7189000248908997},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6596999764442444},{"id":"https://openalex.org/keywords/scratch","display_name":"Scratch","score":0.5935999751091003},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.43700000643730164},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.4101000130176544},{"id":"https://openalex.org/keywords/window","display_name":"Window (computing)","score":0.3443000018596649},{"id":"https://openalex.org/keywords/video-editing","display_name":"Video editing","score":0.3221000134944916}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7832000255584717},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.7426999807357788},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7189000248908997},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6596999764442444},{"id":"https://openalex.org/C2781235140","wikidata":"https://www.wikidata.org/wiki/Q275131","display_name":"Scratch","level":2,"score":0.5935999751091003},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5022000074386597},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.43700000643730164},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.4296000003814697},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.4101000130176544},{"id":"https://openalex.org/C2778751112","wikidata":"https://www.wikidata.org/wiki/Q835016","display_name":"Window (computing)","level":2,"score":0.3443000018596649},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3248000144958496},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.3221000134944916},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.32170000672340393},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.3203999996185303},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3156000077724457},{"id":"https://openalex.org/C89505385","wikidata":"https://www.wikidata.org/wiki/Q47146","display_name":"User interface","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.30169999599456787},{"id":"https://openalex.org/C2780154230","wikidata":"https://www.wikidata.org/wiki/Q513420","display_name":"Undo","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.29600000381469727},{"id":"https://openalex.org/C61641136","wikidata":"https://www.wikidata.org/wiki/Q1107019","display_name":"Cognitive load","level":3,"score":0.2912999987602234},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.2678000032901764},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.05348","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05348","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.05348","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05348","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.707747220993042}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Audio":[0],"description":[1],"(AD)":[2],"narrates":[3],"visual":[4,143],"elements":[5],"in":[6],"video":[7,65],"for":[8,72,133],"blind":[9],"and":[10,31,63,67,82,109],"low-vision":[11],"audiences.":[12],"Recent":[13],"work":[14],"has":[15],"shown":[16],"that":[17,59],"giving":[18],"novice":[19],"describers":[20],"an":[21,39,55,69],"AI-generated":[22],"draft":[23,44],"to":[24,35,128,170],"start":[25],"from":[26,91,119,151],"helps":[27],"produce":[28],"higher-quality":[29],"AD":[30,56],"lowers":[32],"the":[33,47,148,171],"barrier":[34],"entry.":[36],"What":[37],"remains":[38],"open":[40],"question":[41],"is":[42,140],"how":[43],"quality":[45,131,149,167],"shapes":[46],"editing":[48,70,94],"process.":[49],"We":[50,154],"investigate":[51],"this":[52,138,156],"through":[53],"GenAD,":[54],"generation":[57],"pipeline":[58],"incorporates":[60],"accessibility":[61],"guidelines":[62],"contextual":[64],"information,":[66],"RefineAD,":[68],"interface":[71],"human":[73],"revisions.":[74],"Human-AI":[75],"contributions":[76],"are":[77],"measured":[78],"across":[79],"text,":[80],"timing,":[81],"delivery.":[83],"In":[84,114],"a":[85,129,158,166],"within-subjects":[86],"study,":[87],"we":[88],"compared":[89],"authoring":[90],"scratch":[92],"against":[93],"AI":[95,152,162],"drafts":[96,101,117],"of":[97],"varying":[98],"quality.":[99],"GenAD":[100],"cut":[102],"completion":[103],"time":[104],"by":[105],"more":[106],"than":[107,175],"half":[108],"significantly":[110],"reduced":[111],"cognitive":[112],"load.":[113],"contrast,":[115],"baseline":[116],"generated":[118],"simple,":[120],"unguided":[121],"prompts":[122],"offered":[123],"only":[124],"modest":[125],"benefits,":[126],"pointing":[127],"minimum":[130],"threshold":[132,139,168],"effectiveness.":[134],"Qualitative":[135],"findings":[136],"suggest":[137],"content-dependent;":[141],"as":[142,157],"complexity":[144],"increases,":[145],"so":[146],"does":[147],"needed":[150],"drafts.":[153],"propose":[155],"design":[159],"principle:":[160],"effective":[161],"assistance":[163],"should":[164],"clear":[165],"suited":[169],"target":[172],"content,":[173],"rather":[174],"simply":[176],"be":[177],"present.":[178]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-09T00:00:00"}
