{"id":"https://openalex.org/W2955620508","doi":"https://doi.org/10.1109/tmm.2019.2924598","title":"The Role of the Input in Natural Language Video Description","display_name":"The Role of the Input in Natural Language Video Description","publication_year":2019,"publication_date":"2019-06-25","ids":{"openalex":"https://openalex.org/W2955620508","doi":"https://doi.org/10.1109/tmm.2019.2924598","mag":"2955620508"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2019.2924598","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2019.2924598","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/11380/1200034","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041010671","display_name":"Silvia Cascianelli","orcid":"https://orcid.org/0000-0001-7885-6050"},"institutions":[{"id":"https://openalex.org/I27483092","display_name":"University of Perugia","ror":"https://ror.org/00x27da85","country_code":"IT","type":"education","lineage":["https://openalex.org/I27483092"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Silvia Cascianelli","raw_affiliation_strings":["Department of Engineering, University of Perugia, Perugia, Italy"],"raw_orcid":"https://orcid.org/0000-0001-7885-6050","affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Perugia, Perugia, Italy","institution_ids":["https://openalex.org/I27483092"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016925926","display_name":"Gabriele Costante","orcid":"https://orcid.org/0000-0002-8417-9372"},"institutions":[{"id":"https://openalex.org/I27483092","display_name":"University of Perugia","ror":"https://ror.org/00x27da85","country_code":"IT","type":"education","lineage":["https://openalex.org/I27483092"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Gabriele Costante","raw_affiliation_strings":["Department of Engineering, University of Perugia, Perugia, Italy"],"raw_orcid":"https://orcid.org/0000-0002-8417-9372","affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Perugia, Perugia, Italy","institution_ids":["https://openalex.org/I27483092"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060209685","display_name":"Alessandro Devo","orcid":"https://orcid.org/0000-0001-7522-6264"},"institutions":[{"id":"https://openalex.org/I27483092","display_name":"University of Perugia","ror":"https://ror.org/00x27da85","country_code":"IT","type":"education","lineage":["https://openalex.org/I27483092"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alessandro Devo","raw_affiliation_strings":["Department of Engineering, University of Perugia, Perugia, Italy"],"raw_orcid":"https://orcid.org/0000-0001-7522-6264","affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Perugia, Perugia, Italy","institution_ids":["https://openalex.org/I27483092"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023897603","display_name":"Thomas A. Ciarfuglia","orcid":"https://orcid.org/0000-0001-8646-8197"},"institutions":[{"id":"https://openalex.org/I27483092","display_name":"University of Perugia","ror":"https://ror.org/00x27da85","country_code":"IT","type":"education","lineage":["https://openalex.org/I27483092"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Thomas A. Ciarfuglia","raw_affiliation_strings":["Department of Engineering, University of Perugia, Perugia, Italy"],"raw_orcid":"https://orcid.org/0000-0001-8646-8197","affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Perugia, Perugia, Italy","institution_ids":["https://openalex.org/I27483092"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066104170","display_name":"Paolo Valigi","orcid":"https://orcid.org/0000-0002-0486-7678"},"institutions":[{"id":"https://openalex.org/I27483092","display_name":"University of Perugia","ror":"https://ror.org/00x27da85","country_code":"IT","type":"education","lineage":["https://openalex.org/I27483092"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Paolo Valigi","raw_affiliation_strings":["Department of Engineering, University of Perugia, Perugia, Italy"],"raw_orcid":"https://orcid.org/0000-0002-0486-7678","affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Perugia, Perugia, Italy","institution_ids":["https://openalex.org/I27483092"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057733793","display_name":"Mario Luca Fravolini","orcid":"https://orcid.org/0000-0002-3104-8782"},"institutions":[{"id":"https://openalex.org/I27483092","display_name":"University of Perugia","ror":"https://ror.org/00x27da85","country_code":"IT","type":"education","lineage":["https://openalex.org/I27483092"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Mario L. Fravolini","raw_affiliation_strings":["Department of Engineering, University of Perugia, Perugia, Italy"],"raw_orcid":"https://orcid.org/0000-0002-3104-8782","affiliations":[{"raw_affiliation_string":"Department of Engineering, University of Perugia, Perugia, Italy","institution_ids":["https://openalex.org/I27483092"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3051,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.60059521,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"22","issue":"1","first_page":"271","last_page":"283"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9024693965911865},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6766263246536255},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6516597270965576},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.61905437707901},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.5289183855056763},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4515416622161865},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4244816303253174},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42246392369270325},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3719853162765503},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3222864270210266},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3066006600856781}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9024693965911865},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6766263246536255},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6516597270965576},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.61905437707901},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.5289183855056763},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4515416622161865},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4244816303253174},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42246392369270325},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3719853162765503},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3222864270210266},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3066006600856781},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tmm.2019.2924598","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2019.2924598","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},{"id":"pmh:oai:iris.unimore.it:11380/1200034","is_oa":true,"landing_page_url":"http://hdl.handle.net/11380/1200034","pdf_url":null,"source":{"id":"https://openalex.org/S4306400718","display_name":"IRIS UNIMORE (University of Modena and Reggio Emilia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I122346577","host_organization_name":"University of Modena and Reggio Emilia","host_organization_lineage":["https://openalex.org/I122346577"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:iris.uniroma1.it:11573/1494382","is_oa":true,"landing_page_url":"http://hdl.handle.net/11573/1494382","pdf_url":null,"source":{"id":"https://openalex.org/S4377196107","display_name":"IRIS Research product catalog (Sapienza University of Rome)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:iris.unimore.it:11380/1200034","is_oa":true,"landing_page_url":"http://hdl.handle.net/11380/1200034","pdf_url":null,"source":{"id":"https://openalex.org/S4306400718","display_name":"IRIS UNIMORE (University of Modena and Reggio Emilia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I122346577","host_organization_name":"University of Modena and Reggio Emilia","host_organization_lineage":["https://openalex.org/I122346577"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7200000286102295,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":91,"referenced_works":["https://openalex.org/W1514535095","https://openalex.org/W1522734439","https://openalex.org/W1566289585","https://openalex.org/W1572567476","https://openalex.org/W1614298861","https://openalex.org/W1775434803","https://openalex.org/W1923211482","https://openalex.org/W1924770834","https://openalex.org/W1956340063","https://openalex.org/W1961147827","https://openalex.org/W1976080191","https://openalex.org/W1990227137","https://openalex.org/W2064675550","https://openalex.org/W2078238240","https://openalex.org/W2101105183","https://openalex.org/W2123301721","https://openalex.org/W2139501017","https://openalex.org/W2142900973","https://openalex.org/W2152984213","https://openalex.org/W2154652894","https://openalex.org/W2155837945","https://openalex.org/W2164290393","https://openalex.org/W2187089797","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2251353663","https://openalex.org/W2331128040","https://openalex.org/W2425121537","https://openalex.org/W2475287302","https://openalex.org/W2502312327","https://openalex.org/W2506483933","https://openalex.org/W2528841789","https://openalex.org/W2530645150","https://openalex.org/W2557264465","https://openalex.org/W2564590796","https://openalex.org/W2596543464","https://openalex.org/W2600067905","https://openalex.org/W2610850660","https://openalex.org/W2618530766","https://openalex.org/W2735810033","https://openalex.org/W2739107216","https://openalex.org/W2753311918","https://openalex.org/W2754689878","https://openalex.org/W2763440627","https://openalex.org/W2766520430","https://openalex.org/W2766862947","https://openalex.org/W2773842746","https://openalex.org/W2783838156","https://openalex.org/W2788738262","https://openalex.org/W2793476612","https://openalex.org/W2803620531","https://openalex.org/W2808203533","https://openalex.org/W2808647806","https://openalex.org/W2882971061","https://openalex.org/W2885775891","https://openalex.org/W2892269335","https://openalex.org/W2914699769","https://openalex.org/W2962681491","https://openalex.org/W2962937869","https://openalex.org/W2962958773","https://openalex.org/W2963177403","https://openalex.org/W2963410018","https://openalex.org/W2963525668","https://openalex.org/W2963552819","https://openalex.org/W2963683323","https://openalex.org/W2964065937","https://openalex.org/W2964241990","https://openalex.org/W3098341425","https://openalex.org/W3098682680","https://openalex.org/W3099884890","https://openalex.org/W3102887392","https://openalex.org/W4221148458","https://openalex.org/W4230097545","https://openalex.org/W6630875275","https://openalex.org/W6633899822","https://openalex.org/W6634126550","https://openalex.org/W6636510571","https://openalex.org/W6637845829","https://openalex.org/W6640212811","https://openalex.org/W6641082943","https://openalex.org/W6678262379","https://openalex.org/W6680145277","https://openalex.org/W6682631176","https://openalex.org/W6682983702","https://openalex.org/W6684090549","https://openalex.org/W6691419566","https://openalex.org/W6702130928","https://openalex.org/W6730522037","https://openalex.org/W6742457766","https://openalex.org/W6746746734","https://openalex.org/W6754923448"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W4321353415","https://openalex.org/W2130974462","https://openalex.org/W972276598","https://openalex.org/W2086519370","https://openalex.org/W2028665553","https://openalex.org/W2087343574","https://openalex.org/W2535915176","https://openalex.org/W2105860728","https://openalex.org/W4287657826"],"abstract_inverted_index":{"Natural":[0],"language":[1,15],"video":[2],"description":[3],"(NLVD)":[4],"has":[5],"recently":[6],"received":[7],"strong":[8],"interest":[9],"in":[10,119,196],"the":[11,33,48,53,56,59,79,82,89,101,130,133,137,145,149,186,190,197,210],"computer":[12],"vision,":[13],"natural":[14],"processing":[16,54],"(NLP),":[17],"multimedia,":[18],"and":[19,66,113,176,185],"autonomous":[20],"robotics":[21],"communities.":[22],"The":[23,199],"state-of-the-art":[24],"(SotA)":[25],"approaches":[26,38],"obtained":[27],"remarkable":[28],"results":[29],"when":[30],"tested":[31],"on":[32,52,136],"benchmark":[34],"datasets.":[35,43],"However,":[36],"those":[37],"poorly":[39],"generalize":[40],"to":[41,58,76,88,107,128,204,206],"new":[42,187],"In":[44,68],"addition,":[45],"none":[46],"of":[47,55,81,100,132,148,174,189],"existing":[49],"works":[50],"focus":[51],"input":[57],"NLVD":[60,211],"systems,":[61],"which":[62,158],"is":[63,74,94,126,156,159,194,202],"both":[64],"visual":[65,83,102,139],"textual.":[67],"this":[69,143,168],"paper,":[70],"an":[71],"extensive":[72],"study":[73],"presented":[75],"deal":[77],"with":[78,86],"role":[80],"input,":[84],"evaluated":[85],"respect":[87],"overall":[90,138],"NLP":[91],"performance.":[92],"This":[93],"achieved":[95],"by":[96],"performing":[97],"data":[98,140],"augmentation":[99],"component,":[103],"applying":[104],"common":[105],"transformations":[106,135],"model":[108],"camera":[109,114],"distortions,":[110],"noise,":[111],"lighting,":[112],"positioning":[115],"that":[116,167],"are":[117],"typical":[118],"real-world":[120],"operative":[121],"scenarios.":[122],"A":[123],"t-SNE-based":[124],"analysis":[125],"proposed":[127],"evaluate":[129],"effects":[131],"considered":[134],"distribution.":[141],"For":[142],"study,":[144],"English":[146],"subset":[147],"Microsoft":[150],"Research":[151],"Video":[152],"Description":[153],"(MSVD)":[154],"dataset":[155,169,191,201],"considered,":[157],"used":[160,195],"commonly":[161],"for":[162],"NLVD.":[163],"It":[164],"was":[165],"observed":[166],"contains":[170],"a":[171],"relevant":[172],"amount":[173],"syntactic":[175],"semantic":[177],"errors.":[178],"These":[179],"errors":[180],"have":[181],"been":[182],"amended":[183],"manually,":[184],"version":[188],"(called":[192],"MSVD-v2)":[193],"experimentation.":[198],"MSVD-v2":[200],"released":[203],"help":[205],"gain":[207],"insight":[208],"into":[209],"problem.":[212]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
