{"id":"https://openalex.org/W4391149069","doi":"https://doi.org/10.1109/ic-nidc59918.2023.10390866","title":"Dense Local Consistency Loss for Video Semantic Segmentation","display_name":"Dense Local Consistency Loss for Video Semantic Segmentation","publication_year":2023,"publication_date":"2023-11-03","ids":{"openalex":"https://openalex.org/W4391149069","doi":"https://doi.org/10.1109/ic-nidc59918.2023.10390866"},"language":"en","primary_location":{"id":"doi:10.1109/ic-nidc59918.2023.10390866","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ic-nidc59918.2023.10390866","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 8th IEEE International Conference on Network Intelligence and Digital Content (IC-NIDC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102608293","display_name":"Ruhao Xia","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ruhao Xia","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100946285","display_name":"Ling Xu","orcid":"https://orcid.org/0009-0009-0122-5686"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Ling","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100755268","display_name":"Yixiang Huang","orcid":"https://orcid.org/0000-0003-0809-7890"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yixiang Huang","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077902436","display_name":"Ming Wu","orcid":"https://orcid.org/0000-0001-8390-5398"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Wu","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5102608293"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.19091234,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"34","issue":null,"first_page":"389","last_page":"393"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7784910202026367},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7593193650245667},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6752760410308838},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.50914067029953},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5013618469238281},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.4890469014644623},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.47727006673812866},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4537906050682068},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.44896531105041504},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4332408905029297},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.372539758682251}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7784910202026367},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7593193650245667},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6752760410308838},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.50914067029953},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5013618469238281},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.4890469014644623},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.47727006673812866},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4537906050682068},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.44896531105041504},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4332408905029297},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.372539758682251},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ic-nidc59918.2023.10390866","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ic-nidc59918.2023.10390866","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 8th IEEE International Conference on Network Intelligence and Digital Content (IC-NIDC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8698067272","display_name":null,"funder_award_id":"62076093","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1903029394","https://openalex.org/W1923697677","https://openalex.org/W2552900565","https://openalex.org/W2560023338","https://openalex.org/W2561585794","https://openalex.org/W2806676437","https://openalex.org/W2955058313","https://openalex.org/W2962815021","https://openalex.org/W2963866581","https://openalex.org/W2981689412","https://openalex.org/W3108812043","https://openalex.org/W3169367294","https://openalex.org/W3204976424","https://openalex.org/W3211490618","https://openalex.org/W3213165621","https://openalex.org/W4312723735","https://openalex.org/W4312919100","https://openalex.org/W6640295612","https://openalex.org/W6797399245","https://openalex.org/W6798837711"],"related_works":["https://openalex.org/W2185902295","https://openalex.org/W2103507220","https://openalex.org/W3144569342","https://openalex.org/W2945274617","https://openalex.org/W4313052709","https://openalex.org/W2022929107","https://openalex.org/W2055202857","https://openalex.org/W80586315","https://openalex.org/W4205800335","https://openalex.org/W2758994127"],"abstract_inverted_index":{"Existing":[0],"image":[1],"semantic":[2,59,70,105,136,158],"segmentation":[3,106,114,137,159],"models":[4],"often":[5],"suffer":[6],"from":[7],"temporal":[8,111],"inconsistency":[9],"between":[10,62],"consecutive":[11,63,90],"frames":[12,64,118],"when":[13],"processing":[14],"continuous":[15],"video":[16,69,104,135,157],"inputs.":[17],"While":[18],"using":[19],"optical":[20],"flow":[21],"or":[22,123],"incorporating":[23],"historical":[24],"frame":[25],"information":[26],"can":[27],"alleviate":[28],"this":[29],"issue,":[30],"the":[31,66,79,86,110,132,142,162],"resulting":[32],"increase":[33],"in":[34,65,89,153],"parameters":[35,122],"and":[36,103,108,113,156],"computational":[37,124],"complexity":[38],"is":[39,75,94],"detrimental":[40],"to":[41,140],"real-time":[42],"tasks.":[43],"In":[44],"contrast,":[45],"we":[46],"propose":[47],"a":[48],"dense":[49],"local":[50,58],"consistency":[51,60,112],"loss":[52],"dubbed":[53],"DLCL,":[54],"which":[55],"introduces":[56],"spatial":[57],"constraints":[61],"task":[67],"of":[68,82,116,144,164],"segmentation.":[71],"During":[72],"training,":[73],"DLCL":[74,93],"calculated":[76],"based":[77],"on":[78,131],"cosine":[80],"similarity":[81],"feature":[83],"embeddings":[84],"for":[85],"same":[87],"object":[88],"frames.":[91],"Our":[92],"simple":[95],"yet":[96],"effective,":[97],"easily":[98],"integrated":[99],"into":[100],"both":[101,154],"single-frame":[102],"models,":[107,160],"improves":[109],"accuracy":[115],"predicted":[117],"without":[119],"adding":[120],"any":[121],"overhead":[125],"during":[126],"inference.":[127],"We":[128],"conduct":[129],"experiments":[130],"large-scale":[133],"multi-scene":[134],"dataset:":[138],"VSPW,":[139],"demonstrate":[141],"effectiveness":[143],"our":[145,165],"approach.":[146],"The":[147],"results":[148],"consistently":[149],"show":[150],"performance":[151],"improvements":[152],"singleframe":[155],"validating":[161],"efficacy":[163],"method.":[166]},"counts_by_year":[],"updated_date":"2025-12-21T23:12:01.093139","created_date":"2025-10-10T00:00:00"}
