{"id":"https://openalex.org/W2970013683","doi":"https://doi.org/10.18653/v1/d19-1155","title":"Decoupled Box Proposal and Featurization with Ultrafine-Grained Semantic Labels Improve Image Captioning and Visual Question Answering","display_name":"Decoupled Box Proposal and Featurization with Ultrafine-Grained Semantic Labels Improve Image Captioning and Visual Question Answering","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2970013683","doi":"https://doi.org/10.18653/v1/d19-1155","mag":"2970013683"},"language":"en","primary_location":{"id":"doi:10.18653/v1/d19-1155","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d19-1155","pdf_url":"https://www.aclweb.org/anthology/D19-1155.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/D19-1155.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075518871","display_name":"Soravit Changpinyo","orcid":"https://orcid.org/0000-0002-4013-1190"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Soravit Changpinyo","raw_affiliation_strings":["Google AI Venice, CA 90291"],"affiliations":[{"raw_affiliation_string":"Google AI Venice, CA 90291","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101799605","display_name":"Bo Pang","orcid":"https://orcid.org/0000-0003-4521-6369"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bo Pang","raw_affiliation_strings":["Google AI Venice, CA 90291"],"affiliations":[{"raw_affiliation_string":"Google AI Venice, CA 90291","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100679058","display_name":"Piyush Sharma","orcid":"https://orcid.org/0009-0003-0372-4303"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Piyush Sharma","raw_affiliation_strings":["Google AI Venice, CA 90291"],"affiliations":[{"raw_affiliation_string":"Google AI Venice, CA 90291","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089152779","display_name":"Radu Soricut","orcid":"https://orcid.org/0000-0003-1565-3365"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Radu Soricut","raw_affiliation_strings":["Google AI Venice, CA 90291"],"affiliations":[{"raw_affiliation_string":"Google AI Venice, CA 90291","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5075518871"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":1.6195,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.87261197,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1468","last_page":"1474"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8576171398162842},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.8366456627845764},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7438832521438599},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.5765156745910645},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5682782530784607},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4926770329475403},{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.43828269839286804},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.43718820810317993},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3861226439476013},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3841100335121155},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09129694104194641},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.06391477584838867}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8576171398162842},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.8366456627845764},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7438832521438599},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.5765156745910645},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5682782530784607},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4926770329475403},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.43828269839286804},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.43718820810317993},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3861226439476013},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3841100335121155},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09129694104194641},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.06391477584838867},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/d19-1155","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d19-1155","pdf_url":"https://www.aclweb.org/anthology/D19-1155.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/d19-1155","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d19-1155","pdf_url":"https://www.aclweb.org/anthology/D19-1155.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8199999928474426,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2970013683.pdf","grobid_xml":"https://content.openalex.org/works/W2970013683.grobid-xml"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1514535095","https://openalex.org/W1575833922","https://openalex.org/W1861492603","https://openalex.org/W1933349210","https://openalex.org/W1956340063","https://openalex.org/W2102381086","https://openalex.org/W2108325777","https://openalex.org/W2117539524","https://openalex.org/W2153579005","https://openalex.org/W2194775991","https://openalex.org/W2277195237","https://openalex.org/W2506483933","https://openalex.org/W2520135321","https://openalex.org/W2560645892","https://openalex.org/W2560730294","https://openalex.org/W2563399268","https://openalex.org/W2564898401","https://openalex.org/W2570343428","https://openalex.org/W2613718673","https://openalex.org/W2745461083","https://openalex.org/W2767566874","https://openalex.org/W2787119853","https://openalex.org/W2795151422","https://openalex.org/W2884093133","https://openalex.org/W2886641317","https://openalex.org/W2895135219","https://openalex.org/W2907258563","https://openalex.org/W2916754336","https://openalex.org/W2938082352","https://openalex.org/W2962731754","https://openalex.org/W2962749469","https://openalex.org/W2962843773","https://openalex.org/W2963088515","https://openalex.org/W2963403868","https://openalex.org/W2963622213","https://openalex.org/W2963703197","https://openalex.org/W2963907629","https://openalex.org/W2963927307","https://openalex.org/W2964067226","https://openalex.org/W2964115968","https://openalex.org/W2988916019","https://openalex.org/W3016211260","https://openalex.org/W4294170691","https://openalex.org/W4385245566","https://openalex.org/W4388152766"],"related_works":["https://openalex.org/W3157284875","https://openalex.org/W2259406085","https://openalex.org/W3009270862","https://openalex.org/W2099715052","https://openalex.org/W4226247999","https://openalex.org/W4213176082","https://openalex.org/W2187398150","https://openalex.org/W3209772662","https://openalex.org/W4200629926","https://openalex.org/W4220955952"],"abstract_inverted_index":{"Soravit":[0],"Changpinyo,":[1],"Bo":[2],"Pang,":[3],"Piyush":[4],"Sharma,":[5],"Radu":[6],"Soricut.":[7],"Proceedings":[8],"of":[9],"the":[10,21],"2019":[11],"Conference":[12,25],"on":[13,26],"Empirical":[14],"Methods":[15],"in":[16],"Natural":[17,27],"Language":[18,28],"Processing":[19,29],"and":[20],"9th":[22],"International":[23],"Joint":[24],"(EMNLP-IJCNLP).":[30],"2019.":[31]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
