{"id":"https://openalex.org/W2765947428","doi":"https://doi.org/10.1145/3132515.3132522","title":"Image Captioning in the Wild","display_name":"Image Captioning in the Wild","publication_year":2017,"publication_date":"2017-10-23","ids":{"openalex":"https://openalex.org/W2765947428","doi":"https://doi.org/10.1145/3132515.3132522","mag":"2765947428"},"language":"en","primary_location":{"id":"doi:10.1145/3132515.3132522","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3132515.3132522","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Workshop on Multimodal Understanding of Social, Affective and Subjective Attributes","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020380115","display_name":"Philipp Blandfort","orcid":"https://orcid.org/0000-0002-1516-3780"},"institutions":[{"id":"https://openalex.org/I33256026","display_name":"German Research Centre for Artificial Intelligence","ror":"https://ror.org/01ayc5b57","country_code":"DE","type":"funder","lineage":["https://openalex.org/I33256026"]},{"id":"https://openalex.org/I153267046","display_name":"University of Kaiserslautern","ror":"https://ror.org/04zrf7b53","country_code":"DE","type":"education","lineage":["https://openalex.org/I153267046"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Philipp Blandfort","raw_affiliation_strings":["German Institute for Artificial Intelligence &amp; University of Kaiserslautern, Kaiserslautern, Germany"],"affiliations":[{"raw_affiliation_string":"German Institute for Artificial Intelligence &amp; University of Kaiserslautern, Kaiserslautern, Germany","institution_ids":["https://openalex.org/I33256026","https://openalex.org/I153267046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029350364","display_name":"Tushar Karayil","orcid":null},"institutions":[{"id":"https://openalex.org/I33256026","display_name":"German Research Centre for Artificial Intelligence","ror":"https://ror.org/01ayc5b57","country_code":"DE","type":"funder","lineage":["https://openalex.org/I33256026"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tushar Karayil","raw_affiliation_strings":["German Institute for Artificial Intelligence, Kaiserslautern, Germany"],"affiliations":[{"raw_affiliation_string":"German Institute for Artificial Intelligence, Kaiserslautern, Germany","institution_ids":["https://openalex.org/I33256026"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065722787","display_name":"Damian Borth","orcid":"https://orcid.org/0000-0002-4660-2627"},"institutions":[{"id":"https://openalex.org/I33256026","display_name":"German Research Centre for Artificial Intelligence","ror":"https://ror.org/01ayc5b57","country_code":"DE","type":"funder","lineage":["https://openalex.org/I33256026"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Damian Borth","raw_affiliation_strings":["German Institute for Artificial Intelligence, Kaiserslautern, Germany"],"affiliations":[{"raw_affiliation_string":"German Institute for Artificial Intelligence, Kaiserslautern, Germany","institution_ids":["https://openalex.org/I33256026"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101904182","display_name":"Andreas Dengel","orcid":"https://orcid.org/0000-0002-6100-8255"},"institutions":[{"id":"https://openalex.org/I33256026","display_name":"German Research Centre for Artificial Intelligence","ror":"https://ror.org/01ayc5b57","country_code":"DE","type":"funder","lineage":["https://openalex.org/I33256026"]},{"id":"https://openalex.org/I153267046","display_name":"University of Kaiserslautern","ror":"https://ror.org/04zrf7b53","country_code":"DE","type":"education","lineage":["https://openalex.org/I153267046"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Andreas Dengel","raw_affiliation_strings":["German Institute for Artificial Intelligence &amp; University of Kaiserslautern, Kaiserslautern, Germany"],"affiliations":[{"raw_affiliation_string":"German Institute for Artificial Intelligence &amp; University of Kaiserslautern, Kaiserslautern, Germany","institution_ids":["https://openalex.org/I33256026","https://openalex.org/I153267046"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5020380115"],"corresponding_institution_ids":["https://openalex.org/I153267046","https://openalex.org/I33256026"],"apc_list":null,"apc_paid":null,"fwci":0.182,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.57760706,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"21","last_page":"29"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.9446041584014893},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.8109697103500366},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7853368520736694},{"id":"https://openalex.org/keywords/publication","display_name":"Publication","score":0.5986137390136719},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5769500732421875},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5649689435958862},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5517714023590088},{"id":"https://openalex.org/keywords/visibility","display_name":"Visibility","score":0.5270001292228699},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5107071995735168},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.5071005821228027},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4396752119064331},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3705483078956604},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.32003551721572876},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.2871212661266327}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.9446041584014893},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.8109697103500366},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7853368520736694},{"id":"https://openalex.org/C41458344","wikidata":"https://www.wikidata.org/wiki/Q732577","display_name":"Publication","level":2,"score":0.5986137390136719},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5769500732421875},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5649689435958862},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5517714023590088},{"id":"https://openalex.org/C123403432","wikidata":"https://www.wikidata.org/wiki/Q654068","display_name":"Visibility","level":2,"score":0.5270001292228699},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5107071995735168},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.5071005821228027},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4396752119064331},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3705483078956604},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32003551721572876},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.2871212661266327},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C112698675","wikidata":"https://www.wikidata.org/wiki/Q37038","display_name":"Advertising","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3132515.3132522","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3132515.3132522","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Workshop on Multimodal Understanding of Social, Affective and Subjective Attributes","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2835247932","display_name":null,"funder_award_id":"MOM: 01WI15002","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G638475303","display_name":null,"funder_award_id":"NVAIL","funder_id":"https://openalex.org/F4320309480","funder_display_name":"Nvidia"}],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W203719604","https://openalex.org/W1629950035","https://openalex.org/W1773149199","https://openalex.org/W1895577753","https://openalex.org/W1931639407","https://openalex.org/W1966633684","https://openalex.org/W1972846045","https://openalex.org/W2041076459","https://openalex.org/W2057519640","https://openalex.org/W2085417874","https://openalex.org/W2123749709","https://openalex.org/W2143017621","https://openalex.org/W2250384498","https://openalex.org/W2264742718","https://openalex.org/W2524558894","https://openalex.org/W2525668096","https://openalex.org/W2530811251","https://openalex.org/W2531468424","https://openalex.org/W6603094881"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2775506363","https://openalex.org/W3088136942","https://openalex.org/W3032998312","https://openalex.org/W135177976","https://openalex.org/W4290852288","https://openalex.org/W2949362007","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314"],"abstract_inverted_index":{"Automatic":[0],"image":[1,100],"captioning":[2],"is":[3,19,52],"a":[4,33,44,61],"well-known":[5],"problem":[6,16,51],"in":[7,43,99],"the":[8,50,68,91,97,105,114],"field":[9],"of":[10,35,49,67],"artificial":[11],"intelligence.":[12],"To":[13,55],"solve":[14],"this":[15,57],"efficiently,":[17],"it":[18],"also":[20],"required":[21],"to":[22,40,83,94],"understand":[23,56],"how":[24],"people":[25],"caption":[26],"images":[27],"naturally":[28],"(when":[29],"not":[30],"instructed":[31],"by":[32],"set":[34],"rules,":[36],"which":[37],"tell":[38],"them":[39],"do":[41],"so":[42],"certain":[45],"way).":[46],"This":[47],"dimension":[48],"rarely":[53],"discussed.":[54],"aspect,":[58],"we":[59],"performed":[60],"crowdsourcing":[62],"study":[63],"on":[64],"specific":[65],"subsets":[66],"Yahoo":[69],"Flickr":[70],"Creative":[71],"Commons":[72],"100":[73],"Million":[74],"Dataset":[75],"(YFCC100M)":[76],"where":[77],"annotators":[78],"evaluate":[79],"captions":[80,101],"with":[81,113],"respect":[82],"subjectivity,":[84],"visibility,":[85],"appeal":[86],"and":[87],"intent.":[88],"We":[89,107],"use":[90],"resulting":[92],"data":[93],"systematically":[95],"characterize":[96],"variations":[98],"that":[102],"appear":[103],"\"in":[104],"wild\".":[106],"publish":[108],"our":[109],"findings":[110],"here":[111],"along":[112],"annotated":[115],"dataset.":[116]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
