{"id":"https://openalex.org/W4402722199","doi":"https://doi.org/10.1145/3641825.3687742","title":"Toward Facilitating Search in VR With the Assistance of Vision Large Language Models","display_name":"Toward Facilitating Search in VR With the Assistance of Vision Large Language Models","publication_year":2024,"publication_date":"2024-09-22","ids":{"openalex":"https://openalex.org/W4402722199","doi":"https://doi.org/10.1145/3641825.3687742"},"language":"en","primary_location":{"id":"doi:10.1145/3641825.3687742","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3641825.3687742","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"30th ACM Symposium on Virtual Reality Software and Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Chao Liu","orcid":"https://orcid.org/0009-0003-6735-3492"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chao Liu","raw_affiliation_strings":["Computational Media and Arts Thrust, The Hong Kong University of Science and Technology (Guangzhou), China"],"raw_orcid":"https://orcid.org/0009-0003-6735-3492","affiliations":[{"raw_affiliation_string":"Computational Media and Arts Thrust, The Hong Kong University of Science and Technology (Guangzhou), China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004272501","display_name":"Chi San Cheung","orcid":"https://orcid.org/0009-0005-6233-3884"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Chi San (Clarence) Cheung","raw_affiliation_strings":["Academy of Interdisciplinary Studies, The Hong Kong University of Science and Technology, China"],"raw_orcid":"https://orcid.org/0009-0005-6233-3884","affiliations":[{"raw_affiliation_string":"Academy of Interdisciplinary Studies, The Hong Kong University of Science and Technology, China","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013217445","display_name":"Mingqing Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mingqing Xu","raw_affiliation_strings":["Computational Media and Arts Thrust, The Hong Kong University of Science and Technology (Guangzhou), China"],"raw_orcid":"https://orcid.org/0009-0008-2447-8793","affiliations":[{"raw_affiliation_string":"Computational Media and Arts Thrust, The Hong Kong University of Science and Technology (Guangzhou), China","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhongyue Zhang","orcid":"https://orcid.org/0009-0001-1232-004X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhongyue Zhang","raw_affiliation_strings":["Computational Media and Arts Thrust, The Hong Kong University of Science and Technology (Guangzhou), China"],"raw_orcid":"https://orcid.org/0009-0001-1232-004X","affiliations":[{"raw_affiliation_string":"Computational Media and Arts Thrust, The Hong Kong University of Science and Technology (Guangzhou), China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103180236","display_name":"Ming\u2010Yang Su","orcid":"https://orcid.org/0009-0006-3281-7594"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingyang Su","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, China"],"raw_orcid":"https://orcid.org/0009-0006-3281-7594","affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, China","institution_ids":["https://openalex.org/I4210114105"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048919402","display_name":"Mingming Fan","orcid":"https://orcid.org/0000-0002-0356-4712"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mingming Fan","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), China and The Hong Kong University of Science and Technology, China"],"raw_orcid":"https://orcid.org/0000-0002-0356-4712","affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), China and The Hong Kong University of Science and Technology, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.7142,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.7145752,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7457384467124939},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.6096578240394592},{"id":"https://openalex.org/keywords/virtual-reality","display_name":"Virtual reality","score":0.4431525468826294},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.34402841329574585},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3370494842529297}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7457384467124939},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.6096578240394592},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.4431525468826294},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.34402841329574585},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3370494842529297}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3641825.3687742","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3641825.3687742","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"30th ACM Symposium on Virtual Reality Software and Technology","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-146774","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-146774","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1511160209","https://openalex.org/W2052992339","https://openalex.org/W2058310943","https://openalex.org/W2105981469","https://openalex.org/W2136925099","https://openalex.org/W2160368229","https://openalex.org/W2317966680","https://openalex.org/W2343703449","https://openalex.org/W2580237913","https://openalex.org/W2611760972","https://openalex.org/W2799116636","https://openalex.org/W2898714446","https://openalex.org/W2903015182","https://openalex.org/W2963470893","https://openalex.org/W2969210124","https://openalex.org/W2985033890","https://openalex.org/W3035064992","https://openalex.org/W3127403223","https://openalex.org/W3153665132","https://openalex.org/W3160033907","https://openalex.org/W3160592978","https://openalex.org/W3163688954","https://openalex.org/W3187571995","https://openalex.org/W3203211826","https://openalex.org/W4224298125","https://openalex.org/W4224981885","https://openalex.org/W4251196815","https://openalex.org/W4309674289","https://openalex.org/W4361806248","https://openalex.org/W4377164404","https://openalex.org/W4382491206","https://openalex.org/W4384890811","https://openalex.org/W4387251514","https://openalex.org/W4390154854","https://openalex.org/W4390692489","https://openalex.org/W4391114255","https://openalex.org/W4391558438","https://openalex.org/W4392405794","https://openalex.org/W4396831883","https://openalex.org/W4396832250","https://openalex.org/W4396832812","https://openalex.org/W4396833370","https://openalex.org/W4400374438"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2059650074","https://openalex.org/W4285504728"],"abstract_inverted_index":{"While":[0,138],"search":[1,33,50,134,143,162],"is":[2],"a":[3,21,35,40,44,107,132],"common":[4,49],"need":[5],"in":[6,26,84,100,136,163],"Virtual":[7],"Reality":[8],"(VR)":[9],"applications,":[10],"current":[11],"approaches":[12],"are":[13],"cumbersome,":[14],"often":[15],"requiring":[16],"users":[17,111],"to":[18,32,112,128,145],"type":[19],"on":[20,34,116],"mid-air":[22],"keyboard":[23],"using":[24],"controllers":[25],"VR":[27,30,86,124,142,164],"or":[28],"remove":[29],"equipment":[31],"computer.":[36],"We":[37],"first":[38],"conducted":[39,106],"literature":[41],"review":[42],"and":[43,72,80,105,126,165],"formative":[45],"study,":[46],"identifying":[47],"six":[48],"needs:":[51],"knowing":[52,56,62,67],"about":[53,57,68,141],"one":[54],"object,":[55],"the":[58,85,117,159],"object\u2019s":[59],"partial":[60],"details,":[61],"objects":[63,74],"with":[64,70,110],"environmental":[65],"context,":[66],"interactions":[69],"objects,":[71],"finding":[73],"within":[75],"field":[76],"of":[77,82,149,161],"view":[78],"(FOV)":[79],"out":[81],"FOV":[83],"scene.":[87],"Informed":[88],"by":[89],"these":[90],"needs,":[91],"we":[92,119],"designed":[93],"technology":[94],"probes":[95],"that":[96],"leveraged":[97],"recent":[98],"advances":[99],"Vision":[101],"Large":[102],"Language":[103],"Models":[104],"probe-based":[108],"study":[109],"elicit":[113],"feedback.":[114],"Based":[115],"findings,":[118],"derived":[120],"design":[121,154],"principles":[122],"for":[123],"designers":[125],"developers":[127],"consider":[129],"when":[130],"designing":[131],"user-friendly":[133],"interface":[135],"VR.":[137],"prior":[139],"work":[140,152],"tended":[144],"address":[146],"specific":[147],"aspects":[148],"search,":[150],"our":[151],"contributes":[153],"considerations":[155],"aimed":[156],"at":[157],"enhancing":[158],"ease":[160],"potential":[166],"future":[167],"directions.":[168]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
