{"id":"https://openalex.org/W2904579814","doi":"https://doi.org/10.1609/aaai.v33i01.33015781","title":"Learning to Communicate and Solve Visual Blocks-World Tasks","display_name":"Learning to Communicate and Solve Visual Blocks-World Tasks","publication_year":2019,"publication_date":"2019-07-17","ids":{"openalex":"https://openalex.org/W2904579814","doi":"https://doi.org/10.1609/aaai.v33i01.33015781","mag":"2904579814"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v33i01.33015781","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33015781","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4525/4403","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4525/4403","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100360372","display_name":"Qi Zhang","orcid":"https://orcid.org/0000-0002-8562-5987"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Qi Zhang","raw_affiliation_strings":["University of Michigan"],"affiliations":[{"raw_affiliation_string":"University of Michigan","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077109450","display_name":"Richard L. Lewis","orcid":"https://orcid.org/0000-0001-6403-489X"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Richard Lewis","raw_affiliation_strings":["University of Michigan"],"affiliations":[{"raw_affiliation_string":"University of Michigan","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103117754","display_name":"Satinder Singh","orcid":"https://orcid.org/0000-0002-8215-8295"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Satinder Singh","raw_affiliation_strings":["University of Michigan"],"affiliations":[{"raw_affiliation_string":"University of Michigan","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061747257","display_name":"Edmund H. Durfee","orcid":"https://orcid.org/0000-0002-1045-3690"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Edmund Durfee","raw_affiliation_strings":["University of Michigan"],"affiliations":[{"raw_affiliation_string":"University of Michigan","institution_ids":["https://openalex.org/I27837315"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100360372"],"corresponding_institution_ids":["https://openalex.org/I27837315"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"33","issue":"01","first_page":"5781","last_page":"5788"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7431066036224365},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.7131564021110535},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6560191512107849},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.625958263874054},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.6106647849082947},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5627925395965576},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5440711975097656},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49174097180366516},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.47590598464012146},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4383261203765869},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4335898160934448},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4294441044330597},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.36731794476509094},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36044883728027344},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.12565889954566956}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7431066036224365},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.7131564021110535},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6560191512107849},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.625958263874054},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.6106647849082947},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5627925395965576},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5440711975097656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49174097180366516},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.47590598464012146},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4383261203765869},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4335898160934448},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4294441044330597},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.36731794476509094},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36044883728027344},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.12565889954566956},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v33i01.33015781","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33015781","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4525/4403","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v33i01.33015781","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33015781","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4525/4403","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7900000214576721}],"awards":[{"id":"https://openalex.org/G1523888516","display_name":null,"funder_award_id":"FA9550-","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"},{"id":"https://openalex.org/G4818823069","display_name":null,"funder_award_id":"FA9550-15-1-0039","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"},{"id":"https://openalex.org/G5809100787","display_name":null,"funder_award_id":"FA9550","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"}],"funders":[{"id":"https://openalex.org/F4320338279","display_name":"Air Force Office of Scientific Research","ror":"https://ror.org/011e9bt93"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2904579814.pdf","grobid_xml":"https://content.openalex.org/works/W2904579814.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W98006832","https://openalex.org/W1967449835","https://openalex.org/W2018139470","https://openalex.org/W2046104360","https://openalex.org/W2083568566","https://openalex.org/W2120409145","https://openalex.org/W2395575420","https://openalex.org/W2460440635","https://openalex.org/W2547875792","https://openalex.org/W2602275733","https://openalex.org/W2604329066","https://openalex.org/W2621379712","https://openalex.org/W2795890674","https://openalex.org/W2963000099","https://openalex.org/W2963681240","https://openalex.org/W2964338167","https://openalex.org/W4295846245","https://openalex.org/W4298090669","https://openalex.org/W6641909454","https://openalex.org/W6654666479","https://openalex.org/W6662067854","https://openalex.org/W6671211810","https://openalex.org/W7025320856"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W3088136942","https://openalex.org/W2949362007","https://openalex.org/W2775506363","https://openalex.org/W4290852288","https://openalex.org/W4388893791","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314","https://openalex.org/W2949522393"],"abstract_inverted_index":{"We":[0],"study":[1],"emergent":[2,88,100],"communication":[3,89],"between":[4],"speaker":[5,30],"and":[6,35,69,94,109,118,121],"listener":[7,49],"recurrent":[8],"neural-network":[9],"agents":[10],"that":[11,90,136],"are":[12,78,137],"tasked":[13],"to":[14,37,51],"cooperatively":[15],"construct":[16,52],"a":[17,23,39,45,53,62,83],"blocks-world":[18,54],"target":[19,33],"image":[20,34,55,71],"sampled":[21],"from":[22,44,139],"generative":[24],"grammar":[25],"of":[26,41,64,72,82,98,106,112,127],"blocks":[27],"configurations.":[28],"The":[29,48],"receives":[31],"the":[32,65,70,73,80,99,107,125,132,140],"learns":[36,50],"emit":[38],"sequence":[40],"discrete":[42],"symbols":[43],"fixed":[46],"vocabulary.":[47],"by":[56],"choosing":[57],"block":[58],"placement":[59],"actions":[60],"as":[61],"function":[63],"speaker\u2019s":[66],"full":[67],"utterance":[68],"ongoing":[74],"construction.":[75],"Our":[76],"contributions":[77],"(a)":[79],"introduction":[81],"task":[84],"domain":[85],"for":[86,124],"studying":[87],"is":[91],"both":[92],"challenging":[93],"affords":[95],"useful":[96],"analyses":[97],"protocols;":[101],"(b)":[102],"an":[103],"empirical":[104],"comparison":[105],"interpolation":[108],"extrapolation":[110],"performance":[111],"training":[113],"via":[114],"supervised,":[115],"(contextual)":[116],"Bandit,":[117],"reinforcement":[119],"learning;":[120],"(c)":[122],"evidence":[123],"emergence":[126],"interesting":[128],"linguistic":[129],"properties":[130],"in":[131],"RL":[133],"agent":[134],"protocol":[135],"distinct":[138],"other":[141],"two.":[142]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
