{"id":"https://openalex.org/W4387968400","doi":"https://doi.org/10.1145/3581783.3612544","title":"Focusing on Flexible Masks: A Novel Framework for Panoptic Scene Graph Generation with Relation Constraints","display_name":"Focusing on Flexible Masks: A Novel Framework for Panoptic Scene Graph Generation with Relation Constraints","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4387968400","doi":"https://doi.org/10.1145/3581783.3612544"},"language":"en","primary_location":{"id":"doi:10.1145/3581783.3612544","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3581783.3612544","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3581783.3612544","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3581783.3612544","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043898996","display_name":"Jiarui Yang","orcid":"https://orcid.org/0000-0002-0027-4517"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiarui Yang","raw_affiliation_strings":["SKLOIS, Institute of Information Engineering, CAS, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0027-4517","affiliations":[{"raw_affiliation_string":"SKLOIS, Institute of Information Engineering, CAS, Beijing, China","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100443616","display_name":"Chuan Wang","orcid":"https://orcid.org/0000-0003-3856-7646"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuan Wang","raw_affiliation_strings":["SKLOIS, Institute of Information Engineering, CAS, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3856-7646","affiliations":[{"raw_affiliation_string":"SKLOIS, Institute of Information Engineering, CAS, Beijing, China","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103008895","display_name":"Zeming Liu","orcid":"https://orcid.org/0000-0002-3691-8097"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zeming Liu","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3691-8097","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102984394","display_name":"Jiahong Wu","orcid":"https://orcid.org/0000-0001-8583-0414"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiahong Wu","raw_affiliation_strings":["Kuai shou, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8583-0414","affiliations":[{"raw_affiliation_string":"Kuai shou, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008722548","display_name":"Dongsheng Wang","orcid":"https://orcid.org/0000-0002-0255-1936"},"institutions":[{"id":"https://openalex.org/I177955009","display_name":"China University of Political Science and Law","ror":"https://ror.org/00e49gy82","country_code":"CN","type":"education","lineage":["https://openalex.org/I177955009"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongsheng Wang","raw_affiliation_strings":["The Department of Science and Technology Teaching, China University of Political Science and Law, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0255-1936","affiliations":[{"raw_affiliation_string":"The Department of Science and Technology Teaching, China University of Political Science and Law, Beijing, China","institution_ids":["https://openalex.org/I177955009"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003769188","display_name":"Liang Yang","orcid":"https://orcid.org/0000-0001-6291-4359"},"institutions":[{"id":"https://openalex.org/I184843921","display_name":"Hebei University of Technology","ror":"https://ror.org/018hded08","country_code":"CN","type":"education","lineage":["https://openalex.org/I184843921"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Yang","raw_affiliation_strings":["School of Artificial Intelligence, Hebei University of Technology, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0001-6291-4359","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Hebei University of Technology, Tianjin, China","institution_ids":["https://openalex.org/I184843921"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068837264","display_name":"Xiaochun Cao","orcid":"https://orcid.org/0000-0001-7141-708X"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaochun Cao","raw_affiliation_strings":["School of Cyber Science and Technology, Shenzhen Campus of Sun Yat-Sen University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-7141-708X","affiliations":[{"raw_affiliation_string":"School of Cyber Science and Technology, Shenzhen Campus of Sun Yat-Sen University, Shenzhen, China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5043898996"],"corresponding_institution_ids":["https://openalex.org/I4210156404"],"apc_list":null,"apc_paid":null,"fwci":0.942,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.77670904,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"4209","last_page":"4218"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7410614490509033},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.708410382270813},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6780792474746704},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6172993183135986},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5826900005340576},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.4983561038970947},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.4843062460422516},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.45483726263046265},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4537712037563324},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4490917921066284},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.44461044669151306},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4291728138923645},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3876638412475586},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3237581253051758},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2235202193260193},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.20461991429328918},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16788643598556519}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7410614490509033},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.708410382270813},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6780792474746704},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6172993183135986},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5826900005340576},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.4983561038970947},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.4843062460422516},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.45483726263046265},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4537712037563324},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4490917921066284},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.44461044669151306},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4291728138923645},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3876638412475586},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3237581253051758},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2235202193260193},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.20461991429328918},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16788643598556519},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581783.3612544","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3581783.3612544","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3581783.3612544","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3581783.3612544","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3581783.3612544","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3581783.3612544","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3628717404","display_name":null,"funder_award_id":"61972442","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3746838127","display_name":null,"funder_award_id":"2021M703472","funder_id":"https://openalex.org/F4320321543","funder_display_name":"China Postdoctoral Science Foundation"},{"id":"https://openalex.org/G498447184","display_name":null,"funder_award_id":"62102413","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7183324353","display_name":null,"funder_award_id":"U1936208","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321543","display_name":"China Postdoctoral Science Foundation","ror":"https://ror.org/0426zh255"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387968400.pdf","grobid_xml":"https://content.openalex.org/works/W4387968400.grobid-xml"},"referenced_works_count":47,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2077069816","https://openalex.org/W2277195237","https://openalex.org/W2607855566","https://openalex.org/W2910628332","https://openalex.org/W2913618459","https://openalex.org/W2962779575","https://openalex.org/W2963101956","https://openalex.org/W2963184176","https://openalex.org/W2963518342","https://openalex.org/W2963536419","https://openalex.org/W2963649796","https://openalex.org/W2963902384","https://openalex.org/W2963938081","https://openalex.org/W2965182628","https://openalex.org/W2987919422","https://openalex.org/W3010277541","https://openalex.org/W3034355852","https://openalex.org/W3034538190","https://openalex.org/W3035017890","https://openalex.org/W3035454069","https://openalex.org/W3081642947","https://openalex.org/W3096609285","https://openalex.org/W3106328333","https://openalex.org/W3107530881","https://openalex.org/W3108864070","https://openalex.org/W3168649818","https://openalex.org/W3174865181","https://openalex.org/W3177248696","https://openalex.org/W3180659539","https://openalex.org/W3181556077","https://openalex.org/W3182902595","https://openalex.org/W3196936439","https://openalex.org/W3213165621","https://openalex.org/W4214693531","https://openalex.org/W4286982960","https://openalex.org/W4288083516","https://openalex.org/W4312555984","https://openalex.org/W4312563197","https://openalex.org/W4312682661","https://openalex.org/W4312744661","https://openalex.org/W4312815172","https://openalex.org/W4312936847","https://openalex.org/W4313161463","https://openalex.org/W4386075638","https://openalex.org/W4390874575","https://openalex.org/W6797784111"],"related_works":["https://openalex.org/W4285411112","https://openalex.org/W3166204570","https://openalex.org/W3121246613","https://openalex.org/W2085033728","https://openalex.org/W2132137594","https://openalex.org/W2171299904","https://openalex.org/W2798482732","https://openalex.org/W4390494008","https://openalex.org/W2922442631","https://openalex.org/W2053596378"],"abstract_inverted_index":{"Panoptic":[0],"Scene":[1,22],"Graph":[2,23],"Generation":[3,24],"(PSG)":[4],"presents":[5],"pixel-wise":[6],"instance":[7,65],"detection":[8],"and":[9,14,39,85,163,189,202],"localization,":[10],"leading":[11],"to":[12,27,79,95,160],"comprehensive":[13],"precise":[15],"scene":[16,97,193],"graphs.":[17,194],"Current":[18],"methods":[19],"employ":[20],"conventional":[21],"(SGG)":[25],"frameworks":[26],"solve":[28],"the":[29,33,54,69,89,111,115,133,142,148,171,183],"PSG":[30,112],"problem,":[31],"neglecting":[32],"fundamental":[34],"differences":[35],"between":[36],"bounding":[37,42],"boxes":[38,43],"masks,":[40],"i.e.,":[41],"are":[44,49],"allowed":[45],"overlap":[46],"but":[47],"masks":[48,60],"not.":[50],"Since":[51],"segmentation":[52,93,127,162,167,175],"from":[53,132,177],"panoptic":[55,135],"head":[56,136],"has":[57],"deviations,":[58],"non-overlapping":[59],"may":[61,75],"not":[62,76],"afford":[63],"complete":[64,192],"information.":[66],"Subsequently,":[67],"in":[68],"training":[70,116,145],"phase,":[71,91,117,150],"incomplete":[72,92,96],"segmented":[73],"instances":[74,188],"be":[77],"well-aligned":[78],"annotated":[80],"ones,":[81],"causing":[82],"mismatched":[83],"relations":[84],"insufficient":[86],"training.":[87],"During":[88],"inference":[90,149],"leads":[94],"graph":[98],"prediction.":[99],"To":[100],"alleviate":[101],"these":[102],"problems,":[103],"we":[104,118,151],"construct":[105],"a":[106,120,165],"novel":[107],"two-stage":[108],"framework":[109],"for":[110,137],"problem.":[113],"In":[114,147],"design":[119,164],"proposal":[121],"matching":[122],"strategy,":[123],"which":[124],"replaces":[125],"deterministic":[126],"results":[128,176,197],"with":[129],"proposals":[130,178],"extracted":[131],"off-the-shelf":[134],"label":[138],"alignment,":[139],"thereby":[140],"ensuring":[141],"all-matching":[143],"of":[144,156,173],"samples.":[146],"present":[152],"an":[153],"innovative":[154],"concept":[155],"employing":[157],"relation":[158,181],"predictions":[159],"constrain":[161],"relation-constrained":[166],"algorithm.":[168],"By":[169],"reconstructing":[170],"process":[172],"generating":[174],"using":[179],"predicted":[180],"results,":[182],"algorithm":[184],"recovers":[185],"more":[186,191],"valid":[187],"predicts":[190],"The":[195],"experimental":[196],"show":[198],"overall":[199],"superiority,":[200],"effectiveness,":[201],"robustness":[203],"against":[204],"adversarial":[205],"attacks.":[206]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":5}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
