{"id":"https://openalex.org/W4220656844","doi":"https://doi.org/10.1109/tpami.2022.3157198","title":"Text-Driven Video Acceleration: A Weakly-Supervised Reinforcement Learning Method","display_name":"Text-Driven Video Acceleration: A Weakly-Supervised Reinforcement Learning Method","publication_year":2022,"publication_date":"2022-03-07","ids":{"openalex":"https://openalex.org/W4220656844","doi":"https://doi.org/10.1109/tpami.2022.3157198","pmid":"https://pubmed.ncbi.nlm.nih.gov/35254978"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2022.3157198","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3157198","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2203.15778","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Washington Ramos","orcid":"https://orcid.org/0000-0002-0411-8677"},"institutions":[{"id":"https://openalex.org/I110200422","display_name":"Universidade Federal de Minas Gerais","ror":"https://ror.org/0176yjw32","country_code":"BR","type":"education","lineage":["https://openalex.org/I110200422"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Washington Ramos","raw_affiliation_strings":["Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil"],"raw_orcid":"https://orcid.org/0000-0002-0411-8677","affiliations":[{"raw_affiliation_string":"Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil","institution_ids":["https://openalex.org/I110200422"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Michel Silva","orcid":"https://orcid.org/0000-0002-2499-9619"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Michel Silva","raw_affiliation_strings":["Department of Informatics, Universidade Federal de Vi&#x00E7;osa, Vi&#x00E7;osa, Brazil"],"raw_orcid":"https://orcid.org/0000-0002-2499-9619","affiliations":[{"raw_affiliation_string":"Department of Informatics, Universidade Federal de Vi&#x00E7;osa, Vi&#x00E7;osa, Brazil","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Edson Araujo","orcid":"https://orcid.org/0000-0003-0585-5473"},"institutions":[{"id":"https://openalex.org/I110200422","display_name":"Universidade Federal de Minas Gerais","ror":"https://ror.org/0176yjw32","country_code":"BR","type":"education","lineage":["https://openalex.org/I110200422"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Edson Araujo","raw_affiliation_strings":["Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil"],"raw_orcid":"https://orcid.org/0000-0003-0585-5473","affiliations":[{"raw_affiliation_string":"Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil","institution_ids":["https://openalex.org/I110200422"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Victor Moura","orcid":"https://orcid.org/0000-0001-5379-8755"},"institutions":[{"id":"https://openalex.org/I110200422","display_name":"Universidade Federal de Minas Gerais","ror":"https://ror.org/0176yjw32","country_code":"BR","type":"education","lineage":["https://openalex.org/I110200422"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Victor Moura","raw_affiliation_strings":["Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil"],"raw_orcid":"https://orcid.org/0000-0001-5379-8755","affiliations":[{"raw_affiliation_string":"Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil","institution_ids":["https://openalex.org/I110200422"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Keller Oliveira","orcid":"https://orcid.org/0000-0002-1287-7729"},"institutions":[{"id":"https://openalex.org/I110200422","display_name":"Universidade Federal de Minas Gerais","ror":"https://ror.org/0176yjw32","country_code":"BR","type":"education","lineage":["https://openalex.org/I110200422"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Keller Oliveira","raw_affiliation_strings":["Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil"],"raw_orcid":"https://orcid.org/0000-0002-1287-7729","affiliations":[{"raw_affiliation_string":"Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil","institution_ids":["https://openalex.org/I110200422"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Leandro Soriano Marcolino","orcid":"https://orcid.org/0000-0002-3337-8611"},"institutions":[{"id":"https://openalex.org/I67415387","display_name":"Lancaster University","ror":"https://ror.org/04f2nsd36","country_code":"GB","type":"education","lineage":["https://openalex.org/I67415387"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Leandro Soriano Marcolino","raw_affiliation_strings":["Lancaster University, Lancaster, U.K"],"raw_orcid":"https://orcid.org/0000-0002-3337-8611","affiliations":[{"raw_affiliation_string":"Lancaster University, Lancaster, U.K","institution_ids":["https://openalex.org/I67415387"]}]},{"author_position":"last","author":{"id":null,"display_name":"Erickson R. Nascimento","orcid":"https://orcid.org/0000-0003-2973-2232"},"institutions":[{"id":"https://openalex.org/I110200422","display_name":"Universidade Federal de Minas Gerais","ror":"https://ror.org/0176yjw32","country_code":"BR","type":"education","lineage":["https://openalex.org/I110200422"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Erickson R. Nascimento","raw_affiliation_strings":["Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil"],"raw_orcid":"https://orcid.org/0000-0003-2973-2232","affiliations":[{"raw_affiliation_string":"Computer Science Department, Universidade Federal de Minas Gerais, Belo Horizonte, MG, Brazil","institution_ids":["https://openalex.org/I110200422"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I110200422"],"apc_list":null,"apc_paid":null,"fwci":0.4082,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.57879353,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"45","issue":"2","first_page":"2492","last_page":"2504"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.5116000175476074,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.5116000175476074,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.3547999858856201,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.04960000142455101,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7754999995231628},{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.7558000087738037},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5831999778747559},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.567799985408783},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.3765999972820282},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.36550000309944153},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.3603000044822693},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.3481000065803528},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.3425999879837036}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8382999897003174},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7754999995231628},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.7558000087738037},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.692300021648407},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5831999778747559},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.567799985408783},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4424999952316284},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4052000045776367},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.3765999972820282},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.36550000309944153},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3603000044822693},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3425999879837036},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.3416000008583069},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.3384000062942505},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.323199987411499},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2768000066280365},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C2988454689","wikidata":"https://www.wikidata.org/wiki/Q173131","display_name":"Digital video","level":3,"score":0.2687999904155731},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.2565000057220459},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2547999918460846}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tpami.2022.3157198","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3157198","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:35254978","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35254978","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null},{"id":"pmh:oai:arXiv.org:2203.15778","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2203.15778","pdf_url":"https://arxiv.org/pdf/2203.15778","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2203.15778","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2203.15778","pdf_url":"https://arxiv.org/pdf/2203.15778","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321091","display_name":"Coordena\u00e7\u00e3o de Aperfei\u00e7oamento de Pessoal de N\u00edvel Superior","ror":"https://ror.org/00x0ma614"},{"id":"https://openalex.org/F4320322025","display_name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico","ror":"https://ror.org/03swz6y49"},{"id":"https://openalex.org/F4320322468","display_name":"Petrobras","ror":"https://ror.org/0235kyq22"},{"id":"https://openalex.org/F4320322980","display_name":"Funda\u00e7\u00e3o de Amparo \u00e0 Pesquisa do Estado de Minas Gerais","ror":"https://ror.org/00nc55f03"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W102228831","https://openalex.org/W805710393","https://openalex.org/W1573040851","https://openalex.org/W1895577753","https://openalex.org/W1948812921","https://openalex.org/W1978990080","https://openalex.org/W2003553461","https://openalex.org/W2106229755","https://openalex.org/W2119717200","https://openalex.org/W2145339207","https://openalex.org/W2157331557","https://openalex.org/W2250539671","https://openalex.org/W2302086703","https://openalex.org/W2467794422","https://openalex.org/W2470673105","https://openalex.org/W2515191187","https://openalex.org/W2518952733","https://openalex.org/W2554779556","https://openalex.org/W2559909572","https://openalex.org/W2570848768","https://openalex.org/W2604274373","https://openalex.org/W2613031639","https://openalex.org/W2737677090","https://openalex.org/W2738318237","https://openalex.org/W2746553466","https://openalex.org/W2753311918","https://openalex.org/W2753900927","https://openalex.org/W2761873684","https://openalex.org/W2766447205","https://openalex.org/W2775725209","https://openalex.org/W2781922022","https://openalex.org/W2788106261","https://openalex.org/W2793694687","https://openalex.org/W2795187948","https://openalex.org/W2798554470","https://openalex.org/W2910905530","https://openalex.org/W2941599692","https://openalex.org/W2952132648","https://openalex.org/W2957775769","https://openalex.org/W2960416371","https://openalex.org/W2962795934","https://openalex.org/W2963017553","https://openalex.org/W2963155035","https://openalex.org/W2963919999","https://openalex.org/W2963997278","https://openalex.org/W2980037812","https://openalex.org/W2989322838","https://openalex.org/W3011215845","https://openalex.org/W3014832178","https://openalex.org/W3024615975","https://openalex.org/W3034424800","https://openalex.org/W3108154605","https://openalex.org/W3121043223","https://openalex.org/W6631190155","https://openalex.org/W6638667902","https://openalex.org/W6692846177","https://openalex.org/W6695190136","https://openalex.org/W6738806211","https://openalex.org/W6739901393"],"related_works":[],"abstract_inverted_index":{"The":[0],"growth":[1],"of":[2,38],"videos":[3,19,72],"in":[4,101,140],"our":[5,81,134],"digital":[6],"age":[7],"and":[8,51,89,127,143],"the":[9,14,25,29,53,91,102,108,137,147,152],"users'":[10],"limited":[11],"time":[12],"raise":[13],"demand":[15],"for":[16],"processing":[17],"untrimmed":[18],"to":[20,69,83,87,94,123],"produce":[21],"shorter":[22],"versions":[23],"conveying":[24],"same":[26],"information.":[27],"Despite":[28],"remarkable":[30],"progress":[31],"that":[32,133],"summarization":[33],"methods":[34],"have":[35],"made,":[36],"most":[37],"them":[39],"can":[40,116],"only":[41],"select":[42,84],"a":[43,59,65,95,118],"few":[44],"frames":[45,86],"or":[46],"skims,":[47],"creating":[48,99],"visual":[49,128],"gaps":[50,100],"breaking":[52],"video":[54,93],"context.":[55],"This":[56],"paper":[57],"presents":[58],"novel":[60,76],"weakly-supervised":[61],"methodology":[62],"based":[63],"on":[64],"reinforcement":[66],"learning":[67],"formulation":[68],"accelerate":[70],"instructional":[71],"using":[73],"text.":[74],"A":[75],"joint":[77],"reward":[78],"function":[79],"guides":[80],"agent":[82],"which":[85,115],"remove":[88],"reduce":[90],"input":[92],"target":[96],"length":[97],"without":[98],"final":[103],"video.":[104],"We":[105],"also":[106],"propose":[107],"Extended":[109],"Visually-guided":[110],"Document":[111],"Attention":[112],"Network":[113],"(VDAN+),":[114],"generate":[117],"highly":[119],"discriminative":[120],"embedding":[121],"space":[122],"represent":[124],"both":[125],"textual":[126],"data.":[129],"Our":[130],"experiments":[131],"show":[132],"method":[135],"achieves":[136],"best":[138],"performance":[139],"Precision,":[141],"Recall,":[142],"F1":[144],"Score":[145],"against":[146],"baselines":[148],"while":[149],"effectively":[150],"controlling":[151],"video's":[153],"output":[154],"length.":[155]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2022-04-03T00:00:00"}
