{"id":"https://openalex.org/W3120594693","doi":"https://doi.org/10.1117/12.2587152","title":"Multimodal features for shots boundary detection","display_name":"Multimodal features for shots boundary detection","publication_year":2021,"publication_date":"2021-01-04","ids":{"openalex":"https://openalex.org/W3120594693","doi":"https://doi.org/10.1117/12.2587152","mag":"3120594693"},"language":"en","primary_location":{"id":"doi:10.1117/12.2587152","is_oa":false,"landing_page_url":"https://doi.org/10.1117/12.2587152","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Thirteenth International Conference on Machine Vision","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068355128","display_name":"Mohamed Bouyahi","orcid":null},"institutions":[{"id":"https://openalex.org/I142899784","display_name":"University of Sfax","ror":"https://ror.org/04d4sd432","country_code":"TN","type":"education","lineage":["https://openalex.org/I142899784"]}],"countries":["TN"],"is_corresponding":true,"raw_author_name":"Mohamed Bouyahi","raw_affiliation_strings":["Sfax Univ. (Tunisia)"],"affiliations":[{"raw_affiliation_string":"Sfax Univ. (Tunisia)","institution_ids":["https://openalex.org/I142899784"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002474870","display_name":"Yassine Ben Ayed","orcid":"https://orcid.org/0000-0002-3676-3670"},"institutions":[{"id":"https://openalex.org/I142899784","display_name":"University of Sfax","ror":"https://ror.org/04d4sd432","country_code":"TN","type":"education","lineage":["https://openalex.org/I142899784"]}],"countries":["TN"],"is_corresponding":false,"raw_author_name":"Yassine Ben Ayed","raw_affiliation_strings":["Sfax Univ. (Tunisia)"],"affiliations":[{"raw_affiliation_string":"Sfax Univ. (Tunisia)","institution_ids":["https://openalex.org/I142899784"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5068355128"],"corresponding_institution_ids":["https://openalex.org/I142899784"],"apc_list":null,"apc_paid":null,"fwci":0.1921,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.45106209,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"47","last_page":"47"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.9830999970436096,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.822736918926239},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.7445284724235535},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7228775024414062},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6469465494155884},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6110488176345825},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5383905172348022},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5246251225471497},{"id":"https://openalex.org/keywords/similarity-measure","display_name":"Similarity measure","score":0.45747730135917664},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4551742374897003},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.43457168340682983},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.43094468116760254},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.18054619431495667}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.822736918926239},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.7445284724235535},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7228775024414062},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6469465494155884},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6110488176345825},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5383905172348022},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5246251225471497},{"id":"https://openalex.org/C2776517306","wikidata":"https://www.wikidata.org/wiki/Q29017317","display_name":"Similarity measure","level":2,"score":0.45747730135917664},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4551742374897003},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43457168340682983},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.43094468116760254},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.18054619431495667},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1117/12.2587152","is_oa":false,"landing_page_url":"https://doi.org/10.1117/12.2587152","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Thirteenth International Conference on Machine Vision","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3024364549","https://openalex.org/W2319693127","https://openalex.org/W308539617","https://openalex.org/W2072263576","https://openalex.org/W2095030957","https://openalex.org/W2066827917","https://openalex.org/W2474567666","https://openalex.org/W1940044583","https://openalex.org/W2806903871","https://openalex.org/W4320802053"],"abstract_inverted_index":{"Shot":[0],"Boundary":[1],"Detection":[2],"(SBD)":[3],"also":[4],"known":[5],"as":[6,20],"a":[7,12,156],"temporal":[8,29],"video":[9,56],"segmentation":[10,122],"is":[11,57,137],"preprocessing":[13],"task":[14],"for":[15,50,114,131],"multiple":[16],"videos":[17],"applications,":[18],"such":[19],"indexing":[21],"and":[22,117],"retrieval.":[23],"The":[24,36,134],"SBD":[25,84],"output":[26],"provides":[27],"coherent":[28],"units":[30],"which":[31,62],"are":[32],"easy":[33],"to":[34,47,70,76,81,129],"manipulate.":[35],"Most":[37],"previous":[38],"works":[39],"implement":[40],"theirs":[41],"frameworks":[42],"based":[43,123],"on":[44,89,124,139,145],"visual":[45,115,167],"features":[46,98,108],"measure":[48],"similarity":[49,95,116],"transition":[51,132],"detection":[52],"task.":[53,85],"However,":[54],"the":[55,78,83,120,140,150,161],"very":[58],"enriched":[59],"by":[60,93],"data":[61,147],"could":[63],"be":[64],"beneficial.":[65],"In":[66],"this":[67,146],"paper,":[68],"referring":[69],"recent":[71],"multimodal":[72,152],"works,":[73],"we":[74,87,105,118],"propose":[75],"introduce":[77],"audio":[79,121],"components":[80],"increase":[82],"Firstly,":[86],"worked":[88],"candidate":[90],"segments":[91],"obtained":[92,109],"measuring":[94],"between":[96],"low":[97],"(SURF,":[99],"HSF)":[100],"from":[101,110],"original":[102],"video.":[103],"Then":[104],"used":[106,166],"deep":[107],"trained":[111],"model":[112],"(Resnet-50)":[113],"introduced":[119],"Power":[125],"Spectrum":[126],"Density":[127],"(PSD)":[128],"contribute":[130],"detection.":[133],"proposed":[135,151],"method":[136],"evaluated":[138],"clip":[141],"shots":[142],"dataset.":[143],"Experiments":[144],"show":[148],"that":[149,165],"approach":[153],"can":[154],"achieve":[155],"better":[157],"performance":[158],"compared":[159],"with":[160],"state-of-the-art":[162],"of":[163],"methods":[164],"approach.":[168]},"counts_by_year":[{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
