{"id":"https://openalex.org/W7158827398","doi":"https://doi.org/10.1109/access.2026.3687477","title":"GPT Sonography: Hand Gesture Decoding From Forearm Ultrasound Images via a Large Vision-Language Model","display_name":"GPT Sonography: Hand Gesture Decoding From Forearm Ultrasound Images via a Large Vision-Language Model","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7158827398","doi":"https://doi.org/10.1109/access.2026.3687477"},"language":"en","primary_location":{"id":"doi:10.1109/access.2026.3687477","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3687477","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2026.3687477","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064913985","display_name":"Keshav Bimbraw","orcid":"https://orcid.org/0000-0003-3735-7700"},"institutions":[{"id":"https://openalex.org/I107077323","display_name":"Worcester Polytechnic Institute","ror":"https://ror.org/05ejpqr48","country_code":"US","type":"education","lineage":["https://openalex.org/I107077323"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Keshav Bimbraw","raw_affiliation_strings":["Worcester Polytechnic Institute, Worcester, MA, USA"],"raw_orcid":"https://orcid.org/0000-0003-3735-7700","affiliations":[{"raw_affiliation_string":"Worcester Polytechnic Institute, Worcester, MA, USA","institution_ids":["https://openalex.org/I107077323"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134903118","display_name":"Ye Wang","orcid":"https://orcid.org/0000-0001-5220-1830"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ye Wang","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"raw_orcid":"https://orcid.org/0000-0001-5220-1830","affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134893430","display_name":"Jing Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jing Liu","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023338067","display_name":"Toshiaki Koike\u2013Akino","orcid":"https://orcid.org/0000-0002-2578-5372"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Toshiaki Koike-Akino","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"raw_orcid":"https://orcid.org/0000-0002-2578-5372","affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.64140517,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":null,"first_page":"70724","last_page":"70736"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.13600000739097595,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.13600000739097595,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.08810000121593475,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.027400000020861626,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.620199978351593},{"id":"https://openalex.org/keywords/forearm","display_name":"Forearm","score":0.4909000098705292},{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.4429999887943268},{"id":"https://openalex.org/keywords/ultrasonic-imaging","display_name":"Ultrasonic imaging","score":0.4065000116825104},{"id":"https://openalex.org/keywords/ultrasound","display_name":"Ultrasound","score":0.35910001397132874},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.35659998655319214},{"id":"https://openalex.org/keywords/gesture-recognition","display_name":"Gesture recognition","score":0.34310001134872437}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7390999794006348},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6312999725341797},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.620199978351593},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5952000021934509},{"id":"https://openalex.org/C2780214079","wikidata":"https://www.wikidata.org/wiki/Q228537","display_name":"Forearm","level":2,"score":0.4909000098705292},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.4429999887943268},{"id":"https://openalex.org/C2989478337","wikidata":"https://www.wikidata.org/wiki/Q234904","display_name":"Ultrasonic imaging","level":3,"score":0.4065000116825104},{"id":"https://openalex.org/C143753070","wikidata":"https://www.wikidata.org/wiki/Q162564","display_name":"Ultrasound","level":2,"score":0.35910001397132874},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.35659998655319214},{"id":"https://openalex.org/C159437735","wikidata":"https://www.wikidata.org/wiki/Q1519524","display_name":"Gesture recognition","level":3,"score":0.34310001134872437},{"id":"https://openalex.org/C2986892559","wikidata":"https://www.wikidata.org/wiki/Q234904","display_name":"Ultrasound imaging","level":3,"score":0.32659998536109924},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.29420000314712524},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2770000100135803},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.26339998841285706},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.2590000033378601},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.25369998812675476},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.25119999051094055}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2026.3687477","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3687477","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:811528bf94a54b9ea6014a8ee7654db8","is_oa":true,"landing_page_url":"https://doaj.org/article/811528bf94a54b9ea6014a8ee7654db8","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 14, Pp 70724-70736 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2026.3687477","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3687477","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320315072","display_name":"Mitsubishi Electric Research Laboratories","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"vision-language":[1],"models":[2,16,41,67,97],"(LVLMs),":[3],"such":[4,39],"as":[5,21],"the":[6,78,132,158],"Generative":[7],"Pre-trained":[8],"Transformer":[9],"4-omni":[10],"(GPT-4o),":[11],"are":[12],"emerging":[13],"multi-modal":[14],"foundation":[15,40,66],"which":[17],"have":[18],"great":[19],"potential":[20,159],"powerful":[22],"artificial-intelligence":[23],"(AI)":[24],"assistance":[25],"tools":[26],"for":[27,86,143,153,162],"a":[28,45,99],"myriad":[29],"of":[30,48,64,102,160],"applications,":[31],"including":[32],"healthcare,":[33],"industrial,":[34],"and":[35,121,146,180,191],"academic":[36],"sectors.":[37],"Although":[38],"perform":[42],"well":[43],"in":[44,58],"wide":[46],"range":[47],"general":[49],"tasks,":[50],"their":[51],"capability":[52],"without":[53,198],"fine-tuning":[54,63],"is":[55,68],"often":[56],"limited":[57],"specialized":[59],"tasks.":[60],"However,":[61,90],"full":[62],"large":[65,100,181],"challenging":[69],"due":[70],"to":[71,83,140,150,170],"enormous":[72],"computation/memory/dataset":[73],"requirements.":[74],"Ultrasound":[75],"data":[76,116],"from":[77,113,137,147],"forearm":[79,114],"has":[80],"been":[81],"shown":[82],"be":[84],"used":[85],"hand":[87,111],"gesture":[88,164,173],"estimation.":[89],"this":[91],"typically":[92],"requires":[93],"training":[94,179],"deep":[95],"learning":[96,190],"with":[98,118,123],"quantity":[101],"labeled":[103,182],"data.":[104],"We":[105],"show":[106,186],"that":[107,175,187],"GPT-4o":[108],"can":[109,194],"decode":[110],"gestures":[112],"ultrasound":[115,172],"even":[117],"no":[119],"fine-tuning,":[120],"improves":[122],"few-shot,":[124],"retrieval":[125],"augmented":[126],"in-context":[127,189],"learning.":[128],"In":[129],"our":[130],"experiments,":[131],"average":[133],"classification":[134],"accuracy":[135],"improved":[136],"19.3%":[138],"(0-shot)":[139,149],"74.0%":[141],"(2-shot)":[142],"within-session":[144],"testing,":[145],"20.0%":[148],"61.3%":[151],"(3-shot)":[152],"cross-session":[154],"testing.":[155],"This":[156],"demonstrates":[157],"LVLMs":[161],"ultrasound-based":[163],"recognition":[165],"by":[166],"enabling":[167],"an":[168],"alternative":[169],"prior":[171],"pipelines":[174],"require":[176],"dedicated":[177],"model":[178,200],"datasets.":[183],"Additionally,":[184],"we":[185],"few-shot":[188],"retrieval-augmented":[192],"selection":[193],"substantially":[195],"improve":[196],"performance":[197],"any":[199],"fine-tuning.":[201]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-01T00:00:00"}
