{"id":"https://openalex.org/W2927812634","doi":"https://doi.org/10.1109/tip.2020.2967584","title":"Revisiting EmbodiedQA: A Simple Baseline and Beyond","display_name":"Revisiting EmbodiedQA: A Simple Baseline and Beyond","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W2927812634","doi":"https://doi.org/10.1109/tip.2020.2967584","mag":"2927812634","pmid":"https://pubmed.ncbi.nlm.nih.gov/31995489"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2020.2967584","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tip.2020.2967584","pdf_url":"https://ieeexplore.ieee.org/ielx7/83/8835130/08967238.pdf","source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ieeexplore.ieee.org/ielx7/83/8835130/08967238.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yu Wu","orcid":"https://orcid.org/0000-0002-1680-8253"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Yu Wu","raw_affiliation_strings":["Center for Artificial Intelligence, University of Technology Sydney, Ultimo, Australia"],"raw_orcid":"https://orcid.org/0000-0002-1680-8253","affiliations":[{"raw_affiliation_string":"Center for Artificial Intelligence, University of Technology Sydney, Ultimo, Australia","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Lu Jiang","orcid":"https://orcid.org/0000-0003-0286-8439"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lu Jiang","raw_affiliation_strings":["Google Research, Mountain View, USA"],"raw_orcid":"https://orcid.org/0000-0003-0286-8439","affiliations":[{"raw_affiliation_string":"Google Research, Mountain View, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":null,"display_name":"Yi Yang","orcid":"https://orcid.org/0000-0002-0512-880X"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Yi Yang","raw_affiliation_strings":["Center for Artificial Intelligence, University of Technology Sydney, Ultimo, Australia"],"raw_orcid":"https://orcid.org/0000-0002-0512-880X","affiliations":[{"raw_affiliation_string":"Center for Artificial Intelligence, University of Technology Sydney, Ultimo, Australia","institution_ids":["https://openalex.org/I114017466"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I114017466"],"apc_list":null,"apc_paid":null,"fwci":1.9624,"has_fulltext":true,"cited_by_count":25,"citation_normalized_percentile":{"value":0.88319849,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"29","issue":null,"first_page":"3984","last_page":"3992"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6470000147819519,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6470000147819519,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.14139999449253082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.026799999177455902,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.9053000211715698},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.7777000069618225},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6304000020027161},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.5507000088691711},{"id":"https://openalex.org/keywords/upgrade","display_name":"Upgrade","score":0.5246999859809875},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.4860999882221222}],"concepts":[{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.9053000211715698},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.7777000069618225},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7242000102996826},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6304000020027161},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5641999840736389},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.5507000088691711},{"id":"https://openalex.org/C2780615140","wikidata":"https://www.wikidata.org/wiki/Q920419","display_name":"Upgrade","level":2,"score":0.5246999859809875},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.4860999882221222},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.4507000148296356},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42080000042915344},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.34529998898506165},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.29100000858306885},{"id":"https://openalex.org/C151243789","wikidata":"https://www.wikidata.org/wiki/Q17148646","display_name":"Multiple baseline design","level":3,"score":0.26260000467300415}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tip.2020.2967584","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tip.2020.2967584","pdf_url":"https://ieeexplore.ieee.org/ielx7/83/8835130/08967238.pdf","source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:31995489","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/31995489","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null},{"id":"pmh:oai:arXiv.org:1904.04166","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1904.04166","pdf_url":"https://arxiv.org/pdf/1904.04166","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1109/tip.2020.2967584","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tip.2020.2967584","pdf_url":"https://ieeexplore.ieee.org/ielx7/83/8835130/08967238.pdf","source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2927812634.pdf","grobid_xml":"https://content.openalex.org/works/W2927812634.grobid-xml"},"referenced_works_count":49,"referenced_works":["https://openalex.org/W1488766761","https://openalex.org/W1969483458","https://openalex.org/W2055600015","https://openalex.org/W2064675550","https://openalex.org/W2069830673","https://openalex.org/W2119717200","https://openalex.org/W2125409550","https://openalex.org/W2142192571","https://openalex.org/W2277195237","https://openalex.org/W2508497007","https://openalex.org/W2557465155","https://openalex.org/W2560730294","https://openalex.org/W2560920409","https://openalex.org/W2563399268","https://openalex.org/W2585954273","https://openalex.org/W2593841437","https://openalex.org/W2735159761","https://openalex.org/W2745461083","https://openalex.org/W2795832645","https://openalex.org/W2798708692","https://openalex.org/W2798786641","https://openalex.org/W2883630736","https://openalex.org/W2887978863","https://openalex.org/W2899747753","https://openalex.org/W2962684798","https://openalex.org/W2962749469","https://openalex.org/W2963109634","https://openalex.org/W2963383024","https://openalex.org/W2963447367","https://openalex.org/W2963656855","https://openalex.org/W2964487155","https://openalex.org/W2972113750","https://openalex.org/W6631190155","https://openalex.org/W6638523607","https://openalex.org/W6640296258","https://openalex.org/W6685322675","https://openalex.org/W6686883664","https://openalex.org/W6719057275","https://openalex.org/W6729556111","https://openalex.org/W6731334075","https://openalex.org/W6735003056","https://openalex.org/W6736769356","https://openalex.org/W6738165965","https://openalex.org/W6743790455","https://openalex.org/W6746518932","https://openalex.org/W6747912417","https://openalex.org/W6756040250","https://openalex.org/W6756121852","https://openalex.org/W6756881225"],"related_works":[],"abstract_inverted_index":{"In":[0,49,98],"Embodied":[1],"Question":[2],"Answering":[3],"(EmbodiedQA),":[4],"an":[5,9,70,78],"agent":[6,79,114],"interacts":[7],"with":[8],"environment":[10,91],"to":[11,83,88,120,145],"gather":[12],"necessary":[13],"information":[14],"for":[15,45,75],"answering":[16],"user":[17],"questions.":[18,97],"Existing":[19],"works":[20],"have":[21],"laid":[22],"a":[23,60,81,89,105,117,160],"solid":[24],"foundation":[25],"towards":[26],"solving":[27],"this":[28,50,55,99],"interesting":[29],"problem.":[30],"But":[31],"the":[32,46,85,113,122,126,130,135,148,153],"current":[33],"performance,":[34],"especially":[35],"in":[36,108,147,157,163],"navigation,":[37],"suggests":[38],"that":[39,65],"EmbodiedQA":[40,76,131],"might":[41],"be":[42],"too":[43],"challenging":[44],"contemporary":[47],"approaches.":[48],"paper,":[51],"we":[52,102,151],"empirically":[53],"study":[54],"problem":[56],"and":[57,72,111],"introduce":[58],"1)":[59],"simple":[61,139],"yet":[62],"effective":[63],"baseline":[64,140],"achieves":[66,141],"promising":[67],"performance;":[68],"2)":[69],"easier":[71],"practical":[73],"setting":[74],"where":[77],"has":[80],"chance":[82],"adapt":[84],"trained":[86,127],"model":[87],"new":[90,100,109,149],"before":[92],"it":[93],"actually":[94],"answers":[95],"users":[96],"setting,":[101,137,150],"randomly":[103],"place":[104],"few":[106],"objects":[107],"environments,":[110],"upgrade":[112],"policy":[115],"by":[116],"distillation":[118],"network":[119],"retain":[121],"generalization":[123],"ability":[124],"from":[125],"model.":[128],"On":[129],"v1":[132],"benchmark,":[133],"under":[134],"standard":[136],"our":[138],"very":[142],"competitive":[143],"results":[144],"the-state-of-the-art;":[146],"found":[152],"introduced":[154],"small":[155],"change":[156],"settings":[158],"yields":[159],"notable":[161],"gain":[162],"navigation.":[164]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":8}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2019-04-11T00:00:00"}
