{"id":"https://openalex.org/W4205178067","doi":"https://doi.org/10.1109/tcds.2021.3139543","title":"Vision-and-Language Navigation Based on Cross-Modal Feature Fusion in Indoor Environment","display_name":"Vision-and-Language Navigation Based on Cross-Modal Feature Fusion in Indoor Environment","publication_year":2021,"publication_date":"2021-12-31","ids":{"openalex":"https://openalex.org/W4205178067","doi":"https://doi.org/10.1109/tcds.2021.3139543"},"language":"en","primary_location":{"id":"doi:10.1109/tcds.2021.3139543","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcds.2021.3139543","pdf_url":null,"source":{"id":"https://openalex.org/S2488537894","display_name":"IEEE Transactions on Cognitive and Developmental Systems","issn_l":"2379-8920","issn":["2379-8920","2379-8939"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive and Developmental Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067200719","display_name":"Shuhuan Wen","orcid":"https://orcid.org/0000-0002-7646-4958"},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuhuan Wen","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment and the Key Laboratory of Industrial Computer Control Engineering of Hebei Province, Yanshan University, Qinhuangdao, China"],"raw_orcid":"https://orcid.org/0000-0002-7646-4958","affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment and the Key Laboratory of Industrial Computer Control Engineering of Hebei Province, Yanshan University, Qinhuangdao, China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055011853","display_name":"Xiaohan Lv","orcid":null},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaohan Lv","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment and the Key Laboratory of Industrial Computer Control Engineering of Hebei Province, Yanshan University, Qinhuangdao, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment and the Key Laboratory of Industrial Computer Control Engineering of Hebei Province, Yanshan University, Qinhuangdao, China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100420016","display_name":"F. Richard Yu","orcid":"https://orcid.org/0000-0003-1006-7594"},"institutions":[{"id":"https://openalex.org/I67031392","display_name":"Carleton University","ror":"https://ror.org/02qtvee93","country_code":"CA","type":"education","lineage":["https://openalex.org/I67031392"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"F. Richard Yu","raw_affiliation_strings":["Department of Systems and Computer Engineering, Carleton University, Ottawa, ON, Canada"],"raw_orcid":"https://orcid.org/0000-0003-1006-7594","affiliations":[{"raw_affiliation_string":"Department of Systems and Computer Engineering, Carleton University, Ottawa, ON, Canada","institution_ids":["https://openalex.org/I67031392"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006081929","display_name":"Simeng Gong","orcid":"https://orcid.org/0000-0003-1449-1077"},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Simeng Gong","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment and the Key Laboratory of Industrial Computer Control Engineering of Hebei Province, Yanshan University, Qinhuangdao, China"],"raw_orcid":"https://orcid.org/0000-0003-1449-1077","affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment and the Key Laboratory of Industrial Computer Control Engineering of Hebei Province, Yanshan University, Qinhuangdao, China","institution_ids":["https://openalex.org/I39333907"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8733,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.76511279,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"15","issue":"1","first_page":"3","last_page":"15"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9854000210762024,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8848294615745544},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5922917127609253},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5711476802825928},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5141330361366272},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5042001008987427},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.49416306614875793},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.4311476945877075},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4212307035923004},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4128412902355194},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.35217350721359253}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8848294615745544},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5922917127609253},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5711476802825928},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5141330361366272},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5042001008987427},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.49416306614875793},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.4311476945877075},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4212307035923004},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4128412902355194},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35217350721359253},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcds.2021.3139543","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcds.2021.3139543","pdf_url":null,"source":{"id":"https://openalex.org/S2488537894","display_name":"IEEE Transactions on Cognitive and Developmental Systems","issn_l":"2379-8920","issn":["2379-8920","2379-8939"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive and Developmental Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7799999713897705}],"awards":[{"id":"https://openalex.org/G5384475345","display_name":null,"funder_award_id":"62111530148","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6914846217","display_name":null,"funder_award_id":"61773333","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7208349460","display_name":null,"funder_award_id":"201908130016","funder_id":"https://openalex.org/F4320322725","funder_display_name":"China Scholarship Council"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322725","display_name":"China Scholarship Council","ror":"https://ror.org/04atp4p48"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W2605127024","https://openalex.org/W2607750299","https://openalex.org/W2636355936","https://openalex.org/W2807172739","https://openalex.org/W2890902815","https://openalex.org/W2896457183","https://openalex.org/W2926977875","https://openalex.org/W2951973805","https://openalex.org/W2962744691","https://openalex.org/W2963367210","https://openalex.org/W2963451844","https://openalex.org/W2963800628","https://openalex.org/W2964935470","https://openalex.org/W2967186499","https://openalex.org/W2968124245","https://openalex.org/W2969332757","https://openalex.org/W2969876226","https://openalex.org/W2970231061","https://openalex.org/W2970869018","https://openalex.org/W2974759213","https://openalex.org/W2996781902","https://openalex.org/W2999770866","https://openalex.org/W3034578524","https://openalex.org/W3035232877","https://openalex.org/W3098581361","https://openalex.org/W3106806814","https://openalex.org/W3108144224","https://openalex.org/W4297798492","https://openalex.org/W6692846177","https://openalex.org/W6719057275","https://openalex.org/W6739847781","https://openalex.org/W6739901393","https://openalex.org/W6751885507","https://openalex.org/W6752017656","https://openalex.org/W6755207826","https://openalex.org/W6757724268","https://openalex.org/W6759380828","https://openalex.org/W6766904570","https://openalex.org/W6767211374","https://openalex.org/W6767279747","https://openalex.org/W6786772999"],"related_works":["https://openalex.org/W4323768008","https://openalex.org/W1941703695","https://openalex.org/W3131574667","https://openalex.org/W4360995134","https://openalex.org/W4248382324","https://openalex.org/W3023605104","https://openalex.org/W2039473718","https://openalex.org/W2387529410","https://openalex.org/W2383578611","https://openalex.org/W3098003361"],"abstract_inverted_index":{"It":[0],"is":[1,57,102],"challenging":[2],"for":[3],"an":[4,75],"agent":[5,31,60,140,161,170,195,220,281],"to":[6,16,28,32,54,62,78,104,128,154,188,196,203],"simultaneously":[7],"decipher":[8],"visual":[9,43,90,113,122],"and":[10,13,39,72,92,118,133,211,224,234,247,249,290,298],"language":[11,37,73,93,116,119],"information":[12,45,65,117],"make":[14],"decisions":[15],"perform":[17],"corresponding":[18],"actions.":[19],"Recently,":[20],"the":[21,30,40,59,64,67,86,107,126,135,143,147,150,156,160,169,172,184,190,194,198,206,209,213,216,219,229,235,260,265,273,277,280,284,287],"vision-and-language":[22],"navigation":[23,148,288],"task":[24,56],"has":[25],"been":[26],"proposed":[27,261,274],"allow":[29],"navigate":[33,79],"based":[34,182,254,263],"on":[35,183,255,264],"a":[36,47,96,178,292],"instruction":[38],"currently":[41],"visible":[42],"point":[44],"in":[46,74,221,296],"3-D":[48],"indoor":[49],"real":[50],"environment.":[51],"The":[52,269],"key":[53],"this":[55,82,256],"that":[58,112,168,272],"needs":[61],"understand":[63],"of":[66,70,139,146,149,159,193,208,218,279,286],"two":[68],"models":[69],"vision":[71],"unknown":[76,225,299],"environment":[77],"effectively.":[80],"In":[81,201],"study,":[83],"we":[84,152,227],"capture":[85],"alignment":[87],"relationship":[88],"between":[89,215],"features":[91,94,114,120],"using":[95],"cross-modal":[97,108],"feature":[98,131],"fusion":[99,109],"method.":[100,257],"Attention":[101],"used":[103],"set":[105],"up":[106],"module":[110],"so":[111],"contain":[115,121],"information,":[123],"thereby":[124],"allowing":[125],"model":[127,210],"learn":[129],"more":[130],"relationships":[132],"improving":[134],"success":[136],"rate":[137],"(SR)":[138],"navigation.":[141],"Considering":[142],"practical":[144],"significance":[145],"agent,":[151],"aim":[153],"shorten":[155,197],"trajectory":[157,199],"length":[158,285],"as":[162,164],"much":[163],"possible":[165],"while":[166],"ensuring":[167],"reaches":[171],"target":[173],"position":[174],"successfully.":[175],"We":[176,258],"employ":[177],"reinforcement":[179],"learning":[180],"algorithm":[181],"advantage":[185],"actor":[186],"critic":[187],"constrain":[189],"action":[191],"selection":[192],"length.":[200],"order":[202],"further":[204],"improve":[205],"performance":[207,217,295],"reduce":[212],"difference":[214],"known":[222,297],"environments":[223],"environments,":[226],"propose":[228],"data":[230,240,244,251,267],"augmentation":[231,241,245,252],"method":[232,262,275],"Cro-Speaker,":[233],"three":[236],"training":[237],"methods":[238],"Speaker":[239,248],"(SD),":[242],"Cro-Speaker":[243,250],"(CSD),":[246],"(SCSD)":[253],"evaluate":[259],"Room-to-Room":[266],"set.":[268],"results":[270],"show":[271],"improves":[276],"SR":[278],"navigation,":[282],"shortens":[283],"trajectory,":[289],"exhibits":[291],"good":[293],"generalization":[294],"environments.":[300]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":2}],"updated_date":"2026-06-19T17:40:00.097472","created_date":"2025-10-10T00:00:00"}
