{"id":"https://openalex.org/W4415708157","doi":"https://doi.org/10.1109/icme59968.2025.11209235","title":"Visual Relationships Are Different: Appropriate Way To Predict Each Relationship","display_name":"Visual Relationships Are Different: Appropriate Way To Predict Each Relationship","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4415708157","doi":"https://doi.org/10.1109/icme59968.2025.11209235"},"language":null,"primary_location":{"id":"doi:10.1109/icme59968.2025.11209235","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11209235","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111279478","display_name":"Zhenhua Lei","orcid":null},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhenhua Lei","raw_affiliation_strings":["Xidian University,School of Artificial Intelligence,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xidian University,School of Artificial Intelligence,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100458706","display_name":"Xuemei Xie","orcid":"https://orcid.org/0000-0001-7857-0845"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuemei Xie","raw_affiliation_strings":["Xidian University,School of Artificial Intelligence,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xidian University,School of Artificial Intelligence,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I149594827"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5111279478"],"corresponding_institution_ids":["https://openalex.org/I149594827"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.33753558,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7817999720573425,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7817999720573425,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.11420000344514847,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.013399999588727951,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.4950999915599823},{"id":"https://openalex.org/keywords/possessive","display_name":"Possessive","score":0.45730000734329224},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.39820000529289246},{"id":"https://openalex.org/keywords/visual-perception","display_name":"Visual perception","score":0.3578999936580658},{"id":"https://openalex.org/keywords/visual-objects","display_name":"Visual Objects","score":0.3424000144004822},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.33500000834465027}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6312000155448914},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5975000262260437},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.4950999915599823},{"id":"https://openalex.org/C120926136","wikidata":"https://www.wikidata.org/wiki/Q2105891","display_name":"Possessive","level":2,"score":0.45730000734329224},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.39820000529289246},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.39809998869895935},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.3578999936580658},{"id":"https://openalex.org/C2780103172","wikidata":"https://www.wikidata.org/wiki/Q1309721","display_name":"Visual Objects","level":3,"score":0.3424000144004822},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33719998598098755},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.33500000834465027},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.31049999594688416},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3075000047683716},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.2913999855518341},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C58166","wikidata":"https://www.wikidata.org/wiki/Q224821","display_name":"Fuzzy logic","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2653999924659729},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.26159998774528503},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.25839999318122864}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme59968.2025.11209235","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11209235","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2277195237","https://openalex.org/W2549139847","https://openalex.org/W2579549467","https://openalex.org/W2607855566","https://openalex.org/W2963514444","https://openalex.org/W2963536419","https://openalex.org/W2963649796","https://openalex.org/W2963938081","https://openalex.org/W2964080601","https://openalex.org/W2964225075","https://openalex.org/W2981820283","https://openalex.org/W3034538190","https://openalex.org/W3035017890","https://openalex.org/W3081642947","https://openalex.org/W3108864070","https://openalex.org/W3181556077","https://openalex.org/W4288083516","https://openalex.org/W4312682661","https://openalex.org/W4313161463","https://openalex.org/W4382458076","https://openalex.org/W4386075638","https://openalex.org/W4393154528","https://openalex.org/W4402727514","https://openalex.org/W4410955399"],"related_works":[],"abstract_inverted_index":{"Visual":[0],"relationships":[1,27],"are":[2],"different,":[3],"and":[4,28,77,80],"their":[5],"types":[6,24,107],"play":[7],"an":[8,75,83],"important":[9],"role":[10],"in":[11],"visual":[12,26,36,61,110],"scene":[13],"understanding.":[14],"However,":[15],"most":[16],"of":[17,25,44],"the":[18,22,30,42,45,66,69,72,78,105],"existing":[19],"works":[20],"ignore":[21],"different":[23,100],"adopt":[29],"unified":[31],"approach":[32,116],"to":[33,104,108],"learn":[34],"all":[35],"relationships.":[37,111],"It":[38],"not":[39],"only":[40],"limits":[41],"flexibility":[43],"model,":[46],"but":[47],"also":[48],"causes":[49],"fuzzy":[50],"relationship":[51,62,106],"representation.":[52],"To":[53],"address":[54],"this":[55],"problem,":[56],"we":[57,88],"deeply":[58],"study":[59],"four":[60],"types.":[63],"Among":[64],"them,":[65],"geometric":[67],"reflects":[68,74],"spatial":[70],"interaction,":[71],"semantic":[73],"action,":[76],"possessive":[79],"misc":[81],"indicates":[82],"intrinsic":[84],"correlation.":[85],"And":[86],"then,":[87],"propose":[89],"a":[90],"novel":[91],"method-":[92],"Types":[93],"Determine":[94],"Methods":[95],"(TDM)":[96],"-":[97],"which":[98],"designs":[99],"learning":[101],"strategies":[102],"according":[103],"infer":[109],"Experiments":[112],"demonstrate":[113],"that":[114],"our":[115],"achieves":[117],"superior":[118],"or":[119],"competitive":[120],"performance":[121],"over":[122],"previous":[123],"methods,":[124],"validating":[125],"its":[126],"effectiveness.":[127]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-30T00:00:00"}
