{"id":"https://openalex.org/W7161171256","doi":"https://doi.org/10.48550/arxiv.2605.12987","title":"Leveraging Multimodal Self-Consistency Reasoning in Coding Motivational Interviewing for Alcohol Use Reduction","display_name":"Leveraging Multimodal Self-Consistency Reasoning in Coding Motivational Interviewing for Alcohol Use Reduction","publication_year":2026,"publication_date":"2026-05-13","ids":{"openalex":"https://openalex.org/W7161171256","doi":"https://doi.org/10.48550/arxiv.2605.12987"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.12987","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12987","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.12987","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013948381","display_name":"Guangzeng Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Guangzeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136158974","display_name":"James G. Murphy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Murphy, James G.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055844549","display_name":"Benjamin O. Ladd","orcid":"https://orcid.org/0000-0003-0997-0778"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ladd, Benjamin O.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027237221","display_name":"Xiaolei Huang","orcid":"https://orcid.org/0000-0003-0478-8715"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Xiaolei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136170401","display_name":"Brian Borsari","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Borsari, Brian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.1965000033378601,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.1965000033378601,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.15719999372959137,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10043","display_name":"Substance Abuse Treatment and Outcomes","score":0.12540000677108765,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.6682999730110168},{"id":"https://openalex.org/keywords/motivational-interviewing","display_name":"Motivational interviewing","score":0.6668000221252441},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.40880000591278076},{"id":"https://openalex.org/keywords/voting","display_name":"Voting","score":0.352400004863739},{"id":"https://openalex.org/keywords/interview","display_name":"Interview","score":0.3314000070095062}],"concepts":[{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.6682999730110168},{"id":"https://openalex.org/C2777016617","wikidata":"https://www.wikidata.org/wiki/Q1759158","display_name":"Motivational interviewing","level":3,"score":0.6668000221252441},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.576200008392334},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4212000072002411},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41690000891685486},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.40880000591278076},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.352400004863739},{"id":"https://openalex.org/C24845683","wikidata":"https://www.wikidata.org/wiki/Q178651","display_name":"Interview","level":2,"score":0.3314000070095062},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.323199987411499},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.30559998750686646},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.30230000615119934},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.273499995470047},{"id":"https://openalex.org/C151243789","wikidata":"https://www.wikidata.org/wiki/Q17148646","display_name":"Multiple baseline design","level":3,"score":0.26899999380111694}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.12987","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12987","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.12987","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12987","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.42777177691459656,"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"BACKGROUND:":[0],"Coding":[1],"Motivational":[2],"Interviewing":[3],"(MI)":[4],"sessions":[5,82],"is":[6],"essential":[7],"for":[8,102,107,112,119,127,201],"understanding":[9],"client":[10],"behaviors":[11],"and":[12,20,63,116,155,170,213],"predicting":[13],"outcomes,":[14],"but":[15],"it":[16,217],"requires":[17],"substantial":[18],"time":[19],"labor":[21],"from":[22,66,83],"trained":[23],"MI":[24,37,52,85,202,223],"professionals.":[25],"Recent":[26],"advances":[27],"in":[28],"audio-language":[29],"models":[30],"(ALMs)":[31],"offer":[32],"new":[33],"opportunities":[34],"to":[35,48,72,96],"automate":[36],"coding":[38,53,74],"by":[39,141],"capturing":[40],"multimodal":[41,160],"behavioral":[42],"signals.":[43],"OBJECTIVE:":[44],"This":[45],"study":[46],"aims":[47],"develop":[49],"an":[50],"automatic":[51,222],"approach":[54,162],"based":[55],"on":[56,189],"ALMs":[57,90],"that":[58,182,207],"analyzes":[59],"raw":[60],"audio":[61,86],"input":[62],"integrates":[64],"predictions":[65,138],"multiple":[67],"reasoning":[68,133],"trajectories":[69,134],"using":[70,151],"self-consistency":[71,161,195],"improve":[73],"robustness.":[75],"METHODS:":[76],"We":[77,88],"experimented":[78],"with":[79,91],"five":[80],"recorded":[81],"de-identified":[84],"tapes.":[87],"deployed":[89],"four":[92],"complementary":[93],"analytic":[94,100],"prompts":[95],"support":[97,219],"utterance-level":[98],"reasoning:":[99],"prompting":[101,106,111,118,199],"verbal":[103],"cues,":[104,109],"prosody-aware":[105],"acoustic":[108],"evidence-scoring":[110],"quantitative":[113],"hypothesis":[114],"testing,":[115],"comparative":[117],"contrastive":[120],"reasoning.":[121],"Three":[122],"stochastic":[123],"samples":[124],"were":[125,139],"drawn":[126],"each":[128],"prompt,":[129],"generating":[130],"12":[131],"independent":[132],"per":[135],"utterance.":[136],"Final":[137],"determined":[140],"majority":[142],"voting":[143],"across":[144],"all":[145],"trajectories.":[146],"RESULTS:":[147],"Performance":[148],"was":[149],"evaluated":[150],"accuracy,":[152,165],"precision,":[153,167],"recall,":[154,169],"macro-F1":[156,172],"scores.":[157],"The":[158],"proposed":[159],"achieved":[163],"52.56%":[164],"54.03%":[166],"47.45%":[168],"a":[171],"score":[173],"of":[174],"46.40%,":[175],"exceeding":[176],"baseline":[177,198],"methods.":[178],"Systematic":[179],"ablation":[180],"experiments":[181],"removed":[183],"individual":[184],"modules":[185],"consistently":[186],"degraded":[187],"performance":[188],"the":[190],"primary":[191],"metrics.":[192],"CONCLUSIONS:":[193],"Multimodal":[194],"outperforms":[196],"single-pass":[197],"approaches":[200],"coding.":[203,224],"These":[204],"findings":[205],"suggest":[206],"incorporating":[208],"both":[209],"what":[210],"clients":[211],"say":[212,216],"how":[214],"they":[215],"can":[218],"more":[220],"reliable":[221]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-15T00:00:00"}
