{"id":"https://openalex.org/W3196286078","doi":"https://doi.org/10.23919/mva51890.2021.9511350","title":"Video Summarization With Frame Index Vision Transformer","display_name":"Video Summarization With Frame Index Vision Transformer","publication_year":2021,"publication_date":"2021-07-25","ids":{"openalex":"https://openalex.org/W3196286078","doi":"https://doi.org/10.23919/mva51890.2021.9511350","mag":"3196286078"},"language":"en","primary_location":{"id":"doi:10.23919/mva51890.2021.9511350","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mva51890.2021.9511350","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 17th International Conference on Machine Vision and Applications (MVA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072282992","display_name":"Tzu\u2010Chun Hsu","orcid":"https://orcid.org/0000-0001-6503-8139"},"institutions":[{"id":"https://openalex.org/I162838928","display_name":"National Chung Hsing University","ror":"https://ror.org/05vn3ca78","country_code":"TW","type":"education","lineage":["https://openalex.org/I162838928"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Tzu-Chun Hsu","raw_affiliation_strings":["National Chung Hsing University, Taichung, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Chung Hsing University, Taichung, Taiwan","institution_ids":["https://openalex.org/I162838928"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072894881","display_name":"Yi-Sheng Liao","orcid":"https://orcid.org/0009-0009-5122-3996"},"institutions":[{"id":"https://openalex.org/I162838928","display_name":"National Chung Hsing University","ror":"https://ror.org/05vn3ca78","country_code":"TW","type":"education","lineage":["https://openalex.org/I162838928"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yi-Sheng Liao","raw_affiliation_strings":["National Chung Hsing University, Taichung, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Chung Hsing University, Taichung, Taiwan","institution_ids":["https://openalex.org/I162838928"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082146813","display_name":"Chun-Rong Huang","orcid":"https://orcid.org/0000-0003-2372-5429"},"institutions":[{"id":"https://openalex.org/I162838928","display_name":"National Chung Hsing University","ror":"https://ror.org/05vn3ca78","country_code":"TW","type":"education","lineage":["https://openalex.org/I162838928"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chun-Rong Huang","raw_affiliation_strings":["National Chung Hsing University, Taichung, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Chung Hsing University, Taichung, Taiwan","institution_ids":["https://openalex.org/I162838928"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5072282992"],"corresponding_institution_ids":["https://openalex.org/I162838928"],"apc_list":null,"apc_paid":null,"fwci":0.4803,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.64937908,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9678000211715698,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7957046031951904},{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.7876812219619751},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7713479995727539},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6844998598098755},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6562201380729675},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6407598853111267},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5750949382781982},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5193946957588196},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.5177911520004272},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.46483349800109863},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.41860222816467285},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.40454304218292236},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4010462164878845},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07847633957862854}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7957046031951904},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.7876812219619751},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7713479995727539},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6844998598098755},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6562201380729675},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6407598853111267},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5750949382781982},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5193946957588196},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.5177911520004272},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.46483349800109863},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.41860222816467285},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.40454304218292236},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4010462164878845},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07847633957862854},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/mva51890.2021.9511350","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mva51890.2021.9511350","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 17th International Conference on Machine Vision and Applications (MVA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1352019532","display_name":null,"funder_award_id":"MOST109-2221-E-005-063,MOST109-2314-B-006-024,MOST110-2327-B-006-006","funder_id":"https://openalex.org/F4320309618","funder_display_name":"Ministry of Science and Technology"}],"funders":[{"id":"https://openalex.org/F4320309618","display_name":"Ministry of Science and Technology","ror":"https://ror.org/02b207r52"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1502713047","https://openalex.org/W1904325426","https://openalex.org/W1924343884","https://openalex.org/W1966872876","https://openalex.org/W1994864760","https://openalex.org/W2006180404","https://openalex.org/W2068329823","https://openalex.org/W2070490307","https://openalex.org/W2105174364","https://openalex.org/W2109152179","https://openalex.org/W2115060048","https://openalex.org/W2115857089","https://openalex.org/W2119821739","https://openalex.org/W2139009685","https://openalex.org/W2151379678","https://openalex.org/W2194775991","https://openalex.org/W2517959782","https://openalex.org/W2529272619","https://openalex.org/W2737677090","https://openalex.org/W2793668851","https://openalex.org/W2798970487","https://openalex.org/W2902616437","https://openalex.org/W2906430987","https://openalex.org/W2963263347","https://openalex.org/W2963403868","https://openalex.org/W2963919999","https://openalex.org/W2964158702","https://openalex.org/W2964167369","https://openalex.org/W3094502228","https://openalex.org/W3107128832","https://openalex.org/W3119786062","https://openalex.org/W4237634276","https://openalex.org/W4239510810","https://openalex.org/W4385245566","https://openalex.org/W6640109428","https://openalex.org/W6676302953","https://openalex.org/W6677302653","https://openalex.org/W6726497184","https://openalex.org/W6739901393","https://openalex.org/W6741802007","https://openalex.org/W6751495912","https://openalex.org/W6784333009"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W1517524280","https://openalex.org/W4323520239","https://openalex.org/W4317547544","https://openalex.org/W4313395829"],"abstract_inverted_index":{"In":[0,96],"this":[1],"paper,":[2],"we":[3,17],"propose":[4],"a":[5],"novel":[6],"frame":[7,27,32,43],"index":[8,36,44],"vision":[9,45],"transformer":[10,46],"for":[11],"video":[12],"summarization.":[13],"Given":[14],"training":[15],"frames,":[16],"linearly":[18],"project":[19],"the":[20,23,31,35,41,55,58,64,67,71,91],"content":[21],"of":[22,57,90],"frames":[24],"to":[25,53],"obtain":[26],"embedding.":[28],"By":[29],"incorporating":[30],"embedding":[33,37],"with":[34],"and":[38,50,81,93],"class":[39],"embedding,":[40],"proposed":[42,68],"can":[47,100],"be":[48],"efficiently":[49],"effectively":[51],"applied":[52],"learn":[54],"importance":[56],"input":[59],"frames.":[60],"As":[61],"shown":[62],"in":[63,88],"experimental":[65],"results,":[66],"method":[69,99],"outperforms":[70],"state-of-the-art":[72],"deep":[73],"learning":[74],"methods":[75,87],"including":[76],"recurrent":[77],"neural":[78,83],"network":[79,84],"(RNN)":[80],"convolutional":[82],"(CNN)":[85],"based":[86],"both":[89],"SumMe":[92],"TVSum":[94],"datasets.":[95],"addition,":[97],"our":[98],"achieve":[101],"real-time":[102],"computational":[103],"efficiency":[104],"during":[105],"testing.":[106]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
