{"id":"https://openalex.org/W4387698214","doi":"https://doi.org/10.1145/3607541.3616817","title":"Multi-View Predicate Recognition for Solving Semantic Ambiguity Problem in Scene Graph Generation","display_name":"Multi-View Predicate Recognition for Solving Semantic Ambiguity Problem in Scene Graph Generation","publication_year":2023,"publication_date":"2023-10-17","ids":{"openalex":"https://openalex.org/W4387698214","doi":"https://doi.org/10.1145/3607541.3616817"},"language":"en","primary_location":{"id":"doi:10.1145/3607541.3616817","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1145/3607541.3616817","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607541.3616817","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimedia Content Generation and Evaluation: New Methods and Practice","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3607541.3616817","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090243913","display_name":"Xuezhi Tong","orcid":"https://orcid.org/0009-0005-2309-6409"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuezhi Tong","raw_affiliation_strings":["Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0009-0005-2309-6409","affiliations":[{"raw_affiliation_string":"Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013812973","display_name":"Lihua Jing","orcid":"https://orcid.org/0009-0005-6369-7890"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lihua Jing","raw_affiliation_strings":["Institute of Information Engineering, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0005-6369-7890","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066214523","display_name":"C.L. Zou","orcid":"https://orcid.org/0000-0002-1901-5363"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cong Zou","raw_affiliation_strings":["Institute of Information Engineering, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-1901-5363","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100431257","display_name":"Rui Wang","orcid":"https://orcid.org/0009-0003-8935-3119"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Wang","raw_affiliation_strings":["Institute of Information Engineering, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-4792-1945","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5090243913"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12706533,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"201","issue":null,"first_page":"105","last_page":"113"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.7159818410873413},{"id":"https://openalex.org/keywords/predicate","display_name":"Predicate (mathematical logic)","score":0.6922152638435364},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6876504421234131},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5302229523658752},{"id":"https://openalex.org/keywords/scene-graph","display_name":"Scene graph","score":0.5110639333724976},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.48770222067832947},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43149879574775696},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.42513972520828247},{"id":"https://openalex.org/keywords/contradiction","display_name":"Contradiction","score":0.41039279103279114},{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.1007203459739685}],"concepts":[{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.7159818410873413},{"id":"https://openalex.org/C140146324","wikidata":"https://www.wikidata.org/wiki/Q1144319","display_name":"Predicate (mathematical logic)","level":2,"score":0.6922152638435364},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6876504421234131},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5302229523658752},{"id":"https://openalex.org/C179372163","wikidata":"https://www.wikidata.org/wiki/Q1406181","display_name":"Scene graph","level":3,"score":0.5110639333724976},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.48770222067832947},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43149879574775696},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.42513972520828247},{"id":"https://openalex.org/C2776728590","wikidata":"https://www.wikidata.org/wiki/Q363948","display_name":"Contradiction","level":2,"score":0.41039279103279114},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.1007203459739685},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3607541.3616817","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1145/3607541.3616817","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607541.3616817","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimedia Content Generation and Evaluation: New Methods and Practice","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3607541.3616817","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1145/3607541.3616817","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607541.3616817","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimedia Content Generation and Evaluation: New Methods and Practice","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G34267490","display_name":null,"funder_award_id":"62176253","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4857597087","display_name":null,"funder_award_id":"No.62176253, No.U20B2066","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5566207747","display_name":null,"funder_award_id":"U20B2066","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387698214.pdf","grobid_xml":"https://content.openalex.org/works/W4387698214.grobid-xml"},"referenced_works_count":6,"referenced_works":["https://openalex.org/W2186222003","https://openalex.org/W2277195237","https://openalex.org/W2565639579","https://openalex.org/W4312936847","https://openalex.org/W4386075638","https://openalex.org/W4386075828"],"related_works":["https://openalex.org/W2381825231","https://openalex.org/W2377933838","https://openalex.org/W2348916262","https://openalex.org/W4210310594","https://openalex.org/W2330422317","https://openalex.org/W2354224618","https://openalex.org/W2354172502","https://openalex.org/W2391836570","https://openalex.org/W2361796009","https://openalex.org/W2966204614"],"abstract_inverted_index":{"Recent":[0],"works":[1],"on":[2,10,24,280,295],"Scene":[3],"Graph":[4,261],"Generation":[5],"(SGG)":[6],"have":[7],"been":[8],"concentrating":[9],"solving":[11],"the":[12,25,31,34,43,49,52,57,62,83,121,125,134,145,155,161,166,176,183,190,198,225,229,233,247,267,281,292,296],"problem":[13],"of":[14,33,59,80,105,124,128,175,250,253],"long-tailed":[15],"distribution.":[16],"While":[17],"these":[18],"methods":[19],"are":[20,67,85,118,263],"making":[21],"significant":[22],"improvements":[23],"tail":[26],"predicate":[27,234,254],"categories,":[28],"they":[29],"sacrifice":[30],"performance":[32,294],"head":[35],"ones":[36],"severely.":[37],"The":[38,65],"major":[39],"issue":[40],"lies":[41],"in":[42,61,103,204,236],"semantic":[44,156],"ambiguity":[45],"problem,":[46],"which":[47,72,188],"is":[48,102,113,130,136,221,243],"contradiction":[50],"between":[51,77],"commonly":[53],"used":[54,264],"criterion":[55],"and":[56,89,196,202,259,299],"nature":[58],"relationships":[60,84,146],"SGG":[63,297],"datasets.":[64],"models":[66],"evaluated":[68],"with":[69],"graph":[70],"constraint,":[71],"allows":[73],"merely":[74],"one":[75,174],"relationship":[76],"a":[78,100,106,205,301],"pair":[79],"objects.":[81],"However,":[82],"much":[86],"more":[87],"complex":[88],"can":[90,109,210,289],"always":[91],"be":[92,133,148,211],"described":[93],"from":[94,150],"different":[95,122,237,251],"views.":[96],"For":[97],"example,":[98],"when":[99],"man":[101],"front":[104],"computer,":[107],"we":[108,142,181],"also":[110],"say":[111],"he":[112],"watching":[114],"it.":[115],"Both":[116],"options":[117],"plausible,":[119],"describing":[120],"aspects":[123],"relationship.":[126],"Which":[127],"them":[129],"determined":[131],"to":[132,153,172,200,223,228,245,265,269,273],"ground-truth":[135],"highly":[137],"subjective.":[138],"In":[139,158],"this":[140,179],"paper,":[141],"claim":[143],"that":[144,286],"should":[147,163],"considered":[149],"multiple":[151,194],"views":[152,195,252],"avoid":[154],"ambiguity.":[157],"other":[159],"words,":[160],"model":[162,199,226,268,293],"provide":[164,270],"all":[165],"possibilities,":[167],"rather":[168],"than":[169],"being":[170],"biased":[171],"any":[173],"options.":[177],"To":[178],"end,":[180],"propose":[182],"Multi-View":[184,239,256,260],"Predicate":[185,220,240,257],"Recognition":[186],"(MVPR),":[187],"separates":[189],"label":[191],"set":[192],"into":[193,213],"enables":[197],"represent":[201],"predict":[203],"\"multi-view''":[206],"style.":[207],"Specifically,":[208],"MVPR":[209,288],"divided":[212],"three":[214],"parts:":[215],"Adaptive":[216],"Bounding":[217],"Box":[218],"for":[219,232],"proposed":[222],"help":[224],"attend":[227],"crucial":[230],"areas":[231],"categories":[235],"views;":[238],"Feature":[241],"Learning":[242],"designed":[244],"separate":[246],"feature":[248],"space":[249],"categories;":[255],"Prediction":[258],"Constraint":[262],"allow":[266],"multi-view":[271],"predictions":[272],"accurately":[274],"estimate":[275],"ambiguous":[276],"relationships.":[277],"Experimental":[278],"results":[279],"Visual":[282],"Genome":[283],"dataset":[284],"show":[285],"our":[287],"significantly":[290],"improve":[291],"task,":[298],"achieves":[300],"new":[302],"state-of-the-art.":[303]},"counts_by_year":[],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2025-10-10T00:00:00"}
