{"id":"https://openalex.org/W3174554977","doi":"https://doi.org/10.1109/tmm.2021.3092143","title":"Jointly Learning the Attributes and Composition of Shots for Boundary Detection in Videos","display_name":"Jointly Learning the Attributes and Composition of Shots for Boundary Detection in Videos","publication_year":2021,"publication_date":"2021-06-24","ids":{"openalex":"https://openalex.org/W3174554977","doi":"https://doi.org/10.1109/tmm.2021.3092143","mag":"3174554977"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2021.3092143","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3092143","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027532584","display_name":"Xuekun Jiang","orcid":"https://orcid.org/0000-0001-6441-4366"},"institutions":[{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuekun Jiang","raw_affiliation_strings":["State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China","institution_ids":["https://openalex.org/I75689368"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047161111","display_name":"Libiao Jin","orcid":"https://orcid.org/0000-0003-4530-2996"},"institutions":[{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Libiao Jin","raw_affiliation_strings":["State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China","institution_ids":["https://openalex.org/I75689368"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067715162","display_name":"Anyi Rao","orcid":"https://orcid.org/0000-0003-1004-7753"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Anyi Rao","raw_affiliation_strings":["Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026272753","display_name":"Linning Xu","orcid":"https://orcid.org/0000-0003-1026-2410"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linning Xu","raw_affiliation_strings":["Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010087030","display_name":"Dahua Lin","orcid":"https://orcid.org/0000-0002-8865-7896"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dahua Lin","raw_affiliation_strings":["Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5027532584"],"corresponding_institution_ids":["https://openalex.org/I75689368"],"apc_list":null,"apc_paid":null,"fwci":0.7685,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.73294118,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"24","issue":null,"first_page":"3049","last_page":"3059"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.9446420669555664},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8172217607498169},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.698819637298584},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.6267300844192505},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5979832410812378},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.5145070552825928},{"id":"https://openalex.org/keywords/one-shot","display_name":"One shot","score":0.4557911157608032},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.25592344999313354},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.111630380153656}],"concepts":[{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.9446420669555664},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8172217607498169},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.698819637298584},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.6267300844192505},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5979832410812378},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.5145070552825928},{"id":"https://openalex.org/C2992734406","wikidata":"https://www.wikidata.org/wiki/Q413267","display_name":"One shot","level":2,"score":0.4557911157608032},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25592344999313354},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.111630380153656},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tmm.2021.3092143","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3092143","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-141764","is_oa":false,"landing_page_url":"http://lbdiscover.ust.hk/uresolver?url_ver=Z39.88-2004&rft_val_fmt=info:ofi/fmt:kev:mtx:journal&rfr_id=info:sid/HKUST:SPI&rft.genre=article&rft.issn=1520-9210&rft.volume=24&rft.issue=&rft.date=2022&rft.spage=3049&rft.aulast=Jiang&rft.aufirst=Xuekun&rft.atitle=Jointly+Learning+the+Attributes+and+Composition+of+Shots+for+Boundary+Detection+in+Videos&rft.title=IEEE+Transactions+on+Multimedia","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W204943900","https://openalex.org/W1522734439","https://openalex.org/W1564781546","https://openalex.org/W1661793846","https://openalex.org/W1784139536","https://openalex.org/W1947481528","https://openalex.org/W1971802635","https://openalex.org/W1977991519","https://openalex.org/W1986053712","https://openalex.org/W2000689228","https://openalex.org/W2005750530","https://openalex.org/W2022035644","https://openalex.org/W2044374442","https://openalex.org/W2064675550","https://openalex.org/W2072078925","https://openalex.org/W2077430162","https://openalex.org/W2079735306","https://openalex.org/W2093265140","https://openalex.org/W2106791119","https://openalex.org/W2108431203","https://openalex.org/W2117539524","https://openalex.org/W2139219692","https://openalex.org/W2139501017","https://openalex.org/W2144385786","https://openalex.org/W2158261396","https://openalex.org/W2161827960","https://openalex.org/W2163099731","https://openalex.org/W2194775991","https://openalex.org/W2545708073","https://openalex.org/W2577619402","https://openalex.org/W2608022654","https://openalex.org/W2666798396","https://openalex.org/W2739107216","https://openalex.org/W2753311918","https://openalex.org/W2780608998","https://openalex.org/W2795041432","https://openalex.org/W2798970487","https://openalex.org/W2950846997","https://openalex.org/W2962790054","https://openalex.org/W2962907269","https://openalex.org/W2963315828","https://openalex.org/W2963729528","https://openalex.org/W2965759948","https://openalex.org/W2980037812","https://openalex.org/W2984287396","https://openalex.org/W3034364644","https://openalex.org/W3095481265","https://openalex.org/W3096861448","https://openalex.org/W3102887392","https://openalex.org/W3110420575","https://openalex.org/W6637373629","https://openalex.org/W6739901393"],"related_works":["https://openalex.org/W2497720472","https://openalex.org/W4292659306","https://openalex.org/W3044321615","https://openalex.org/W4294892107","https://openalex.org/W2806221744","https://openalex.org/W2326937258","https://openalex.org/W394267150","https://openalex.org/W2357748469","https://openalex.org/W2392917037","https://openalex.org/W2046675961"],"abstract_inverted_index":{"In":[0,99],"film":[1],"making,":[2],"shot":[3,34,47,82,96,110,134,141,166,181,208],"has":[4],"a":[5,40,104,139,203,220],"profound":[6],"influence":[7],"on":[8,69],"how":[9,16,94],"the":[10,17,56,59,70,116,126,131,158,177,187,194,199,217],"movie":[11,151],"content":[12,74],"is":[13,97,154],"delivered":[14,28],"and":[15,24,58,73,88,118,130,164,172],"audiences":[18],"are":[19,176],"echoed,":[20],"where":[21],"different":[22],"emotions":[23],"contents":[25],"can":[26,191],"be":[27,53],"through":[29],"well-designed":[30],"camera":[31,85,169],"movements":[32],"or":[33],"editing.":[35],"Therefore,":[36],"in":[37,122],"pursuit":[38],"of":[39,43,120,128,133],"high-level":[41],"understanding":[42],"long":[44],"videos,":[45],"accurate":[46],"detection":[48,112,135,196,210],"from":[49,149,212],"untrimmed":[50],"videos":[51],"should":[52],"considered":[54],"as":[55],"first":[57],"most":[60,179],"fundamental":[61],"step.":[62],"Existing":[63],"approaches":[64],"address":[65],"this":[66,100],"problem":[67],"based":[68],"visual":[71],"difference":[72],"transitions":[75],"between":[76,161],"consecutive":[77,162],"frames,":[78],"while":[79],"ignoring":[80],"intrinsic":[81],"attributes,":[83,167],"viz.,":[84],"movements,":[86,170],"scales":[87,171],"viewing":[89,173],"angles,":[90,174],"which":[91,145,175],"essentially":[92],"reveals":[93],"each":[95],"created.":[98],"work,":[101],"we":[102,137],"propose":[103],"new":[105,221],"learning":[106,189],"framework":[107,190],"(SCTSNet)":[108],"for":[109],"boundary":[111,142,160,195,209],"by":[113,202],"jointly":[114],"recognizing":[115],"attributes":[117],"composition":[119],"shots":[121,129,148,163],"videos.":[123],"To":[124],"facilitate":[125],"analysis":[127],"evaluation":[132],"models,":[136],"collect":[138],"large-scale":[140],"dataset":[143],"MovieShots2,":[144],"contains":[146],"15K":[147],"282":[150],"clips.":[152],"It":[153],"richly":[155],"annotated":[156],"with":[157],"temporal":[159],"its":[165],"including":[168],"three":[178],"distinct":[180],"attributes.":[182],"Our":[183],"experiments":[184],"show":[185],"that":[186],"joint":[188],"significantly":[192],"boost":[193],"performance,":[197],"surpassing":[198],"previous":[200],"scores":[201],"large":[204],"margin.":[205],"SCTSNet":[206],"improves":[207],"AP":[211],"0.65":[213],"to":[214,219],"0.77,":[215],"pushing":[216],"performance":[218],"level.":[222]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
