{"id":"https://openalex.org/W4417470373","doi":"https://doi.org/10.1109/tmm.2025.3645596","title":"VikitaFusion: Object Recognition Based on Heterogeneous Visual-Kinesthetic-Tactile Information","display_name":"VikitaFusion: Object Recognition Based on Heterogeneous Visual-Kinesthetic-Tactile Information","publication_year":2025,"publication_date":"2025-12-18","ids":{"openalex":"https://openalex.org/W4417470373","doi":"https://doi.org/10.1109/tmm.2025.3645596"},"language":null,"primary_location":{"id":"doi:10.1109/tmm.2025.3645596","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3645596","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026496427","display_name":"R S Zhang","orcid":"https://orcid.org/0009-0008-2494-1063"},"institutions":[{"id":"https://openalex.org/I80947539","display_name":"Fuzhou University","ror":"https://ror.org/011xvna82","country_code":"CN","type":"education","lineage":["https://openalex.org/I80947539"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Rouqi Zhang","raw_affiliation_strings":["Fujian Key Lab for Intelligent Processing and Wireless Transmission of Media Information, Fuzhou University, Fuzhou, China"],"affiliations":[{"raw_affiliation_string":"Fujian Key Lab for Intelligent Processing and Wireless Transmission of Media Information, Fuzhou University, Fuzhou, China","institution_ids":["https://openalex.org/I80947539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102992609","display_name":"Ting Zhang","orcid":"https://orcid.org/0009-0009-7170-253X"},"institutions":[{"id":"https://openalex.org/I80947539","display_name":"Fuzhou University","ror":"https://ror.org/011xvna82","country_code":"CN","type":"education","lineage":["https://openalex.org/I80947539"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ting Zhang","raw_affiliation_strings":["Fujian Key Lab for Intelligent Processing and Wireless Transmission of Media Information, Fuzhou University, Fuzhou, China"],"affiliations":[{"raw_affiliation_string":"Fujian Key Lab for Intelligent Processing and Wireless Transmission of Media Information, Fuzhou University, Fuzhou, China","institution_ids":["https://openalex.org/I80947539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059963421","display_name":"Jinde Zhu","orcid":"https://orcid.org/0000-0003-0359-1267"},"institutions":[{"id":"https://openalex.org/I83791580","display_name":"Fujian University of Technology","ror":"https://ror.org/03c8fdb16","country_code":"CN","type":"education","lineage":["https://openalex.org/I83791580"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinde Zhu","raw_affiliation_strings":["School of Computer Science and Mathematics, Fujian University of Technology, Fuzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Mathematics, Fujian University of Technology, Fuzhou, China","institution_ids":["https://openalex.org/I83791580"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016217185","display_name":"Weiling Chen","orcid":"https://orcid.org/0000-0002-1400-1659"},"institutions":[{"id":"https://openalex.org/I80947539","display_name":"Fuzhou University","ror":"https://ror.org/011xvna82","country_code":"CN","type":"education","lineage":["https://openalex.org/I80947539"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weiling Chen","raw_affiliation_strings":["Fujian Key Lab for Intelligent Processing and Wireless Transmission of Media Information, Fuzhou University, Fuzhou, China"],"affiliations":[{"raw_affiliation_string":"Fujian Key Lab for Intelligent Processing and Wireless Transmission of Media Information, Fuzhou University, Fuzhou, China","institution_ids":["https://openalex.org/I80947539"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057108758","display_name":"Tiesong Zhao","orcid":"https://orcid.org/0000-0002-7497-8883"},"institutions":[{"id":"https://openalex.org/I80947539","display_name":"Fuzhou University","ror":"https://ror.org/011xvna82","country_code":"CN","type":"education","lineage":["https://openalex.org/I80947539"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tiesong Zhao","raw_affiliation_strings":["Fujian Key Lab for Intelligent Processing and Wireless Transmission of Media Information, Fuzhou University, Fuzhou, China"],"affiliations":[{"raw_affiliation_string":"Fujian Key Lab for Intelligent Processing and Wireless Transmission of Media Information, Fuzhou University, Fuzhou, China","institution_ids":["https://openalex.org/I80947539"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5026496427"],"corresponding_institution_ids":["https://openalex.org/I80947539"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.40205639,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"28","issue":null,"first_page":"1909","last_page":"1920"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10338","display_name":"Advanced Sensor and Energy Harvesting Materials","score":0.48579999804496765,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10338","display_name":"Advanced Sensor and Energy Harvesting Materials","score":0.48579999804496765,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10914","display_name":"Tactile and Sensory Interactions","score":0.09610000252723694,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.0625,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kinesthetic-learning","display_name":"Kinesthetic learning","score":0.7627999782562256},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.6208999752998352},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5573999881744385},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.46880000829696655},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.44190001487731934},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42739999294281006},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.41839998960494995},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4041000008583069},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.36899998784065247}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8411999940872192},{"id":"https://openalex.org/C55457006","wikidata":"https://www.wikidata.org/wiki/Q3647098","display_name":"Kinesthetic learning","level":2,"score":0.7627999782562256},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6606000065803528},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.6208999752998352},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5573999881744385},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.46880000829696655},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.44190001487731934},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42739999294281006},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4194999933242798},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.41839998960494995},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4041000008583069},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.36899998784065247},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.36559998989105225},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.352400004863739},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.351500004529953},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3361000120639801},{"id":"https://openalex.org/C135981907","wikidata":"https://www.wikidata.org/wiki/Q188056","display_name":"Triangulation","level":2,"score":0.33489999175071716},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.32899999618530273},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.3203999996185303},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3140999972820282},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.29510000348091125},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.29019999504089355},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.2786000072956085},{"id":"https://openalex.org/C121687571","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Activity recognition","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.2653999924659729},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3645596","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3645596","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1531333757","https://openalex.org/W2064675550","https://openalex.org/W2075654868","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2344531169","https://openalex.org/W2725171488","https://openalex.org/W2775635818","https://openalex.org/W2811204324","https://openalex.org/W2883780447","https://openalex.org/W2952866402","https://openalex.org/W2963446712","https://openalex.org/W2963654998","https://openalex.org/W2963915174","https://openalex.org/W2963918968","https://openalex.org/W2964054038","https://openalex.org/W2982083293","https://openalex.org/W3020895012","https://openalex.org/W3034429256","https://openalex.org/W3110666852","https://openalex.org/W3128880094","https://openalex.org/W3138516171","https://openalex.org/W4225966488","https://openalex.org/W4246193833","https://openalex.org/W4285132138","https://openalex.org/W4312349930","https://openalex.org/W4312443924","https://openalex.org/W4312847199","https://openalex.org/W4320713352","https://openalex.org/W4327630646","https://openalex.org/W4377231435","https://openalex.org/W4382119137","https://openalex.org/W4386939388","https://openalex.org/W4387805864","https://openalex.org/W4394597793","https://openalex.org/W4399528595","https://openalex.org/W4402354011","https://openalex.org/W4402703046","https://openalex.org/W4402726993","https://openalex.org/W4402775306","https://openalex.org/W4402968400","https://openalex.org/W4404708922","https://openalex.org/W4416748821"],"related_works":[],"abstract_inverted_index":{"Kinesthetic":[0],"and":[1,16,39,54,77,111,134,174],"tactile":[2,53,110],"information":[3,32],"can":[4,23],"represent":[5],"the":[6,49,65,71,78,149,187],"physical":[7],"states":[8],"of":[9,21,35,67,73,80],"objects,":[10],"encompassing":[11],"roughness,":[12],"stiffness,":[13],"motion,":[14],"force,":[15],"other":[17],"attributes.":[18],"The":[19],"introduction":[20],"these":[22],"enhance":[24],"imprecise":[25],"recognition":[26,172],"that":[27,105,123,164],"relies":[28],"solely":[29],"on":[30],"visual":[31,107],"in":[33,155],"cases":[34],"light":[36],"disturbance,":[37],"occlusion":[38],"camouflage.":[40],"Nevertheless,":[41],"this":[42,59,61],"task":[43],"is":[44,97],"still":[45],"challenging":[46],"due":[47],"to":[48],"heterogeneity":[50],"among":[51],"visual,":[52],"kinesthetic":[55,112],"data.":[56],"To":[57],"address":[58],"issue,":[60],"paper":[62],"delves":[63],"into":[64],"alignment":[66],"heterogeneous":[68,74,85,102,157],"data":[69,75,103,113],"dimensions,":[70],"fusion":[72,122,127,132,136],"features,":[76],"optimization":[79],"learning":[81,87,150,159],"rates":[82],"for":[83,152],"multi-source":[84,156],"sensor":[86,158],"models.":[88,160],"Consequently,":[89],"an":[90],"effective":[91],"Visual-Kinesthetic-Tactile":[92],"Information":[93],"Fusion":[94],"(VikitaFusion)":[95],"network":[96],"proposed,":[98],"which":[99],"comprises:":[100],"1)":[101],"extractors":[104],"align":[106],"images":[108],"with":[109,170],"through":[114,129],"image-to-sequence":[115],"projection;":[116],"2)":[117],"a":[118,130,139,175],"visual-kinesthetic-tactile":[119],"Transformer-based":[120],"domain":[121],"mimics":[124],"human":[125],"multi-sensory":[126],"perception":[128],"feature-level":[131],"block":[133],"dynamic":[135],"blocks;":[137],"3)":[138],"Periodic":[140],"Triangulation":[141],"Learning":[142],"Rate":[143],"(PTLR)":[144],"method":[145],"aimed":[146],"at":[147],"optimizing":[148],"rate":[151],"performance":[153],"enhancement":[154],"Extensive":[161],"experiments":[162],"demonstrate":[163],"VikitaFusion":[165],"outperforms":[166],"current":[167],"state-of-the-art":[168],"methods":[169],"higher":[171],"accuracy":[173],"lower":[176],"parameter":[177],"size.":[178],"Source":[179],"code":[180],"will":[181],"be":[182],"made":[183],"publicly":[184],"available":[185],"after":[186],"peer":[188],"review":[189],"process.":[190]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-18T00:00:00"}
