{"id":"https://openalex.org/W4411635711","doi":"https://doi.org/10.1145/3731715.3733374","title":"LLAUS: A High-Quality Instruction-Tuned Large Vision Language Assistant for UltraSound","display_name":"LLAUS: A High-Quality Instruction-Tuned Large Vision Language Assistant for UltraSound","publication_year":2025,"publication_date":"2025-06-25","ids":{"openalex":"https://openalex.org/W4411635711","doi":"https://doi.org/10.1145/3731715.3733374"},"language":"en","primary_location":{"id":"doi:10.1145/3731715.3733374","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3731715.3733374","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100445468","display_name":"Junhao Guo","orcid":"https://orcid.org/0000-0001-7907-0260"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Junhao Guo","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115600233","display_name":"Xuefeng Shan","orcid":"https://orcid.org/0009-0008-6011-0769"},"institutions":[{"id":"https://openalex.org/I154093214","display_name":"Xinjiang Medical University","ror":"https://ror.org/01p455v08","country_code":"CN","type":"education","lineage":["https://openalex.org/I154093214"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"XueFeng Shan","raw_affiliation_strings":["Xinjiang Medical University, Xinjiang, China"],"affiliations":[{"raw_affiliation_string":"Xinjiang Medical University, Xinjiang, China","institution_ids":["https://openalex.org/I154093214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101477058","display_name":"Guoming Wang","orcid":"https://orcid.org/0000-0003-3131-6916"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guoming Wang","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091714064","display_name":"Dong Chen","orcid":"https://orcid.org/0000-0002-4859-1757"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Chen","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070447777","display_name":"Rongxing Lu","orcid":"https://orcid.org/0000-0001-5720-0941"},"institutions":[{"id":"https://openalex.org/I106938459","display_name":"University of New Brunswick","ror":"https://ror.org/05nkf0n29","country_code":"CA","type":"education","lineage":["https://openalex.org/I106938459"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Rongxing Lu","raw_affiliation_strings":["University of New Brunswick, Fredericton, Canada"],"affiliations":[{"raw_affiliation_string":"University of New Brunswick, Fredericton, Canada","institution_ids":["https://openalex.org/I106938459"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063062444","display_name":"Siliang Tang","orcid":"https://orcid.org/0000-0002-7356-9711"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siliang Tang","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100445468"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":1.319,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.82179811,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"398","last_page":"406"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7195523977279663},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6114039421081543},{"id":"https://openalex.org/keywords/ultrasound","display_name":"Ultrasound","score":0.448506236076355},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.32435643672943115},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.09858289361000061},{"id":"https://openalex.org/keywords/radiology","display_name":"Radiology","score":0.08561581373214722}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7195523977279663},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6114039421081543},{"id":"https://openalex.org/C143753070","wikidata":"https://www.wikidata.org/wiki/Q162564","display_name":"Ultrasound","level":2,"score":0.448506236076355},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32435643672943115},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.09858289361000061},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.08561581373214722},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3731715.3733374","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3731715.3733374","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6800000071525574,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W1956340063","https://openalex.org/W2142900395","https://openalex.org/W2990138404","https://openalex.org/W6600013530","https://openalex.org/W6600459194"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"multimodal":[3,165],"large":[4],"models":[5],"in":[6,105,170],"the":[7,27,59,110,117,126],"medical":[8,71,98],"field":[9],"have":[10,137],"garnered":[11],"widespread":[12],"attention.":[13],"However,":[14],"this":[15],"focus":[16],"has":[17,74],"primarily":[18],"been":[19,75],"on":[20,158,175],"CT":[21,47],"and":[22,33,48,55,66,130,136,183],"MRI":[23,49],"imaging,":[24],"inadvertently":[25],"neglecting":[26],"needs":[28],"of":[29,112,119],"economically":[30,64],"underdeveloped":[31],"regions":[32],"specific":[34],"populations,":[35],"such":[36],"as":[37],"pregnant":[38],"women.":[39],"These":[40],"groups":[41],"are":[42],"often":[43],"unable":[44],"to":[45,51,58,94,102,108,181],"utilize":[46],"due":[50],"their":[52],"prohibitive":[53],"costs":[54],"potential":[56],"harm":[57],"body.":[60],"Meanwhile,":[61],"ultrasound,":[62],"an":[63],"viable":[65],"very":[67],"low":[68],"side":[69],"effects":[70],"imaging":[72],"technique,":[73],"largely":[76],"overlooked":[77],"by":[78],"researchers.":[79],"This":[80],"study":[81],"introduces":[82],"a":[83,139,146,152],"high-quality":[84,121,140,159],"instruction-tuned":[85],"Large":[86,147],"vision":[87],"Language":[88],"Assistant":[89],"for":[90,186],"UltraSound":[91],"(LLAUS),":[92],"designed":[93],"answer":[95],"questions":[96],"about":[97],"ultrasound":[99,122,166,172,187],"images,":[100,188],"aiming":[101],"assist":[103],"clinicians":[104],"impoverished":[106],"areas":[107],"improve":[109],"provision":[111],"healthcare":[113],"services.":[114],"To":[115],"address":[116],"challenge":[118],"missing":[120],"data,":[123],"we":[124,144],"propose":[125],"Adaptive":[127,131],"Caption":[128,132],"Enhancement(ACE)":[129],"Optimization":[133],"(ACO)":[134],"strategies":[135],"developed":[138],"instruction-following":[141,160],"dataset.":[142],"Subsequently,":[143],"fine-tune":[145],"Vision-Language":[148],"Model":[149],"(LVLM)":[150],"using":[151],"novel":[153],"Zoom-In":[154],"method.":[155],"By":[156],"training":[157],"datas,":[161],"LLAUS":[162,189],"demonstrates":[163],"exceptional":[164],"communication":[167],"capabilities,":[168],"assisting":[169],"querying":[171],"images":[173],"based":[174],"open-ended":[176],"instructions.":[177],"On":[178],"tasks":[179],"related":[180],"question-answering":[182],"caption":[184],"generation":[185],"exhibits":[190],"strong":[191],"performance.":[192]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
