{"id":"https://openalex.org/W4416036950","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.315","title":"RAV: Retrieval-Augmented Voting for Tactile Descriptions Without Training","display_name":"RAV: Retrieval-Augmented Voting for Tactile Descriptions Without Training","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4416036950","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.315"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2025.emnlp-main.315","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.315","pdf_url":"https://aclanthology.org/2025.emnlp-main.315.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.emnlp-main.315.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101790108","display_name":"Jinlin Wang","orcid":"https://orcid.org/0000-0003-1113-5835"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jinlin Wang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085604594","display_name":"Yulong Ji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yulong Ji","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100542752","display_name":"Yang Hongyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hongyu Yang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101790108"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.34713346,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"6198","last_page":"6205"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.47690001130104065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.47690001130104065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.07530000060796738,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.07100000232458115,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.6412000060081482},{"id":"https://openalex.org/keywords/voting","display_name":"Voting","score":0.4239000082015991},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.2655999958515167},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.2524999976158142},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.24729999899864197}],"concepts":[{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.6412000060081482},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4860999882221222},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.4239000082015991},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3894999921321869},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.35249999165534973},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2655999958515167},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.24729999899864197},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.227400004863739},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.2240999937057495}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.emnlp-main.315","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.315","pdf_url":"https://aclanthology.org/2025.emnlp-main.315.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.emnlp-main.315","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.315","pdf_url":"https://aclanthology.org/2025.emnlp-main.315.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322990","display_name":"Sichuan University","ror":"https://ror.org/011ashp19"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416036950.pdf","grobid_xml":"https://content.openalex.org/works/W4416036950.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Tactile":[0],"perception":[1,33],"is":[2,14],"essential":[3],"for":[4,18,31,59],"humanenvironment":[5],"interaction,":[6],"and":[7,36,62,65,81,101,116],"deriving":[8],"tactile":[9,63,67],"descriptions":[10,68],"from":[11],"multimodal":[12,32],"data":[13,58,102,110],"a":[15,46,70],"key":[16],"challenge":[17],"embodied":[19],"intelligence":[20],"to":[21,86],"understand":[22],"human":[23],"perception.Conventional":[24],"approaches":[25],"relying":[26],"on":[27],"extensive":[28],"parameter":[29],"learning":[30],"are":[34,119],"rigid":[35],"computationally":[37],"inefficient.To":[38],"address":[39],"this,":[40],"we":[41,74],"introduce":[42],"Retrieval-Augmented":[43],"Voting":[44],"(RAV),":[45],"parameter-free":[47],"method":[48],"that":[49,104],"constructs":[50],"visualtactile":[51],"cross-modal":[52],"knowledge":[53],"directly.RAV":[54],"retrieves":[55],"similar":[56],"visual-tactile":[57],"given":[60],"visual":[61],"inputs":[64],"generates":[66],"through":[69],"voting":[71,77],"mechanism.In":[72],"experiments,":[73],"applied":[75],"three":[76],"strategies,":[78],"SyncVote,":[79],"DualVote":[80],"WeightVote,":[82],"achieving":[83],"performance":[84,106],"comparable":[85],"large-scale":[87],"crossmodal":[88],"models":[89],"without":[90],"training.Comparative":[91],"experiments":[92],"across":[93],"datasets":[94],"of":[95],"varying":[96],"quality-defined":[97],"by":[98],"annotation":[99],"accuracy":[100],"diversity-demonstrate":[103],"RAV's":[105],"improves":[107],"with":[108],"higher-quality":[109],"at":[111,121],"no":[112],"additional":[113],"computational":[114],"cost.Code,":[115],"model":[117],"checkpoints":[118],"opensourced":[120],"https:":[122],"//github.com/PluteW/RAV.":[123]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-11-08T00:00:00"}
