{"id":"https://openalex.org/W2984375830","doi":"https://doi.org/10.18653/v1/k19-1040","title":"Leveraging Past References for Robust Language Grounding","display_name":"Leveraging Past References for Robust Language Grounding","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2984375830","doi":"https://doi.org/10.18653/v1/k19-1040","mag":"2984375830"},"language":"en","primary_location":{"id":"doi:10.18653/v1/k19-1040","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/k19-1040","pdf_url":"https://www.aclweb.org/anthology/K19-1040.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd Conference on Computational Natural Language Learning (CoNLL)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/K19-1040.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041779935","display_name":"Subhro Roy","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Subhro Roy","raw_affiliation_strings":["Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074228294","display_name":"Michael D. Noseworthy","orcid":"https://orcid.org/0000-0003-1464-159X"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Noseworthy","raw_affiliation_strings":["Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002249903","display_name":"Rohan Paul","orcid":"https://orcid.org/0000-0002-6733-1766"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rohan Paul","raw_affiliation_strings":["Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074295573","display_name":"Daehyung Park","orcid":"https://orcid.org/0000-0002-1287-9433"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Daehyung Park","raw_affiliation_strings":["Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004980809","display_name":"Nicholas Roy","orcid":"https://orcid.org/0000-0002-4277-2928"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicholas Roy","raw_affiliation_strings":["Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Computer Science and Artificial Intelligence Laboratory Massachusetts Institute of Technology","institution_ids":["https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5041779935"],"corresponding_institution_ids":["https://openalex.org/I63966007"],"apc_list":null,"apc_paid":null,"fwci":0.5108,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.70174028,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/coreference","display_name":"Coreference","score":0.8379148244857788},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.800915002822876},{"id":"https://openalex.org/keywords/ground","display_name":"Ground","score":0.7968196272850037},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6434662342071533},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6370925307273865},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.5476894378662109},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5212660431861877},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.44723019003868103},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.44396013021469116},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4028928577899933},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.38361671566963196},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.298056423664093},{"id":"https://openalex.org/keywords/resolution","display_name":"Resolution (logic)","score":0.1707865595817566},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.08689123392105103},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07148441672325134}],"concepts":[{"id":"https://openalex.org/C28076734","wikidata":"https://www.wikidata.org/wiki/Q63087","display_name":"Coreference","level":3,"score":0.8379148244857788},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.800915002822876},{"id":"https://openalex.org/C168993435","wikidata":"https://www.wikidata.org/wiki/Q6501125","display_name":"Ground","level":2,"score":0.7968196272850037},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6434662342071533},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6370925307273865},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.5476894378662109},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5212660431861877},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.44723019003868103},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.44396013021469116},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4028928577899933},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.38361671566963196},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.298056423664093},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.1707865595817566},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08689123392105103},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07148441672325134},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.18653/v1/k19-1040","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/k19-1040","pdf_url":"https://www.aclweb.org/anthology/K19-1040.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd Conference on Computational Natural Language Learning (CoNLL)","raw_type":"proceedings-article"},{"id":"pmh:oai:dspace.mit.edu:1721.1/137308","is_oa":true,"landing_page_url":"https://hdl.handle.net/1721.1/137308","pdf_url":null,"source":{"id":"https://openalex.org/S4306400425","display_name":"DSpace@MIT (Massachusetts Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63966007","host_organization_name":"Massachusetts Institute of Technology","host_organization_lineage":["https://openalex.org/I63966007"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Association for Computational Linguistics","raw_type":"http://purl.org/eprint/type/ConferencePaper"}],"best_oa_location":{"id":"doi:10.18653/v1/k19-1040","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/k19-1040","pdf_url":"https://www.aclweb.org/anthology/K19-1040.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd Conference on Computational Natural Language Learning (CoNLL)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320315934","display_name":"Toyota Research Institute","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2984375830.pdf","grobid_xml":"https://content.openalex.org/works/W2984375830.grobid-xml"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1686810756","https://openalex.org/W1861492603","https://openalex.org/W2064675550","https://openalex.org/W2089652186","https://openalex.org/W2110930288","https://openalex.org/W2117130368","https://openalex.org/W2159398820","https://openalex.org/W2250539671","https://openalex.org/W2293700449","https://openalex.org/W2294505934","https://openalex.org/W2489434015","https://openalex.org/W2558535589","https://openalex.org/W2576920940","https://openalex.org/W2597655663","https://openalex.org/W2736923367","https://openalex.org/W2768661419","https://openalex.org/W2773391718","https://openalex.org/W2788810331","https://openalex.org/W2892245540","https://openalex.org/W2899771611","https://openalex.org/W2902699874","https://openalex.org/W2952316487","https://openalex.org/W2962700105","https://openalex.org/W2962835968","https://openalex.org/W2963109634","https://openalex.org/W2963244312","https://openalex.org/W2963386218","https://openalex.org/W2963499246","https://openalex.org/W2963918774","https://openalex.org/W2964121744","https://openalex.org/W2964284374","https://openalex.org/W4249803144","https://openalex.org/W4295803813"],"related_works":["https://openalex.org/W2139373276","https://openalex.org/W2227889443","https://openalex.org/W4385749782","https://openalex.org/W3167631113","https://openalex.org/W2765988220","https://openalex.org/W2145164276","https://openalex.org/W2004630825","https://openalex.org/W2732813147","https://openalex.org/W2143460112","https://openalex.org/W4292830139"],"abstract_inverted_index":{"Grounding":[0],"referring":[1,37,48,73,86,101],"expressions":[2,38,71,87],"to":[3,27,74,88,108,129,137],"objects":[4,40,110],"in":[5,17,148],"an":[6,105],"environment":[7],"has":[8],"traditionally":[9],"been":[10],"considered":[11],"a":[12,34,64],"one-off,":[13],"ahistorical":[14],"task.":[15],"However,":[16],"realistic":[18],"applications":[19],"of":[20,31,59],"grounding,":[21],"multiple":[22],"users":[23],"will":[24],"repeatedly":[25],"refer":[26],"the":[28,53,57,75,127,134,149],"same":[29,76],"set":[30],"objects.":[32],"As":[33],"result,":[35],"past":[36,85],"for":[39,45],"can":[41],"provide":[42],"strong":[43],"signals":[44],"grounding":[46,54,119,135],"subsequent":[47],"expressions.":[49],"We":[50,124],"therefore":[51],"reframe":[52],"problem":[55],"from":[56,82],"perspective":[58],"coreference":[60,103,132],"detection":[61],"and":[62,84],"propose":[63],"neural":[65],"network":[66,79],"that":[67,99],"detects":[68],"when":[69,141],"two":[70],"are":[72],"object.":[77],"The":[78],"combines":[80],"information":[81],"vision":[83],"resolve":[89],"which":[90,116],"object":[91,131,144],"is":[92,104],"being":[93],"referred":[94],"to.":[95],"Our":[96],"experiments":[97],"show":[98,126],"detecting":[100],"expression":[102],"effective":[106],"way":[107],"ground":[109],"described":[111],"by":[112],"subtle":[113],"visual":[114,118],"properties,":[115],"standard":[117],"models":[120],"have":[121],"difficulty":[122],"capturing.":[123],"also":[125],"ability":[128],"detect":[130],"allows":[133],"model":[136],"perform":[138],"well":[139],"even":[140],"it":[142],"encounters":[143],"categories":[145],"not":[146],"seen":[147],"training":[150],"data.":[151]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
