{"id":"https://openalex.org/W7129773208","doi":"https://doi.org/10.1109/icipw68931.2025.11386242","title":"A Novel Image Similarity Metric For Scene Composition Structure","display_name":"A Novel Image Similarity Metric For Scene Composition Structure","publication_year":2025,"publication_date":"2025-09-14","ids":{"openalex":"https://openalex.org/W7129773208","doi":"https://doi.org/10.1109/icipw68931.2025.11386242"},"language":null,"primary_location":{"id":"doi:10.1109/icipw68931.2025.11386242","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icipw68931.2025.11386242","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Image Processing Workshops (ICIPW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126254447","display_name":"Md Redwanul Haque","orcid":null},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Md Redwanul Haque","raw_affiliation_strings":["Deakin University,School of Information Technology,Burwood,Victoria,Australia"],"affiliations":[{"raw_affiliation_string":"Deakin University,School of Information Technology,Burwood,Victoria,Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126236237","display_name":"Manzur Murshed","orcid":null},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Manzur Murshed","raw_affiliation_strings":["Deakin University,School of Information Technology,Burwood,Victoria,Australia"],"affiliations":[{"raw_affiliation_string":"Deakin University,School of Information Technology,Burwood,Victoria,Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120872003","display_name":"Manoranjan Paul","orcid":null},"institutions":[{"id":"https://openalex.org/I153230381","display_name":"Charles Sturt University","ror":"https://ror.org/00wfvh315","country_code":"AU","type":"education","lineage":["https://openalex.org/I153230381"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Manoranjan Paul","raw_affiliation_strings":["Charles Sturt University,School of Computing, Mathematics and Engineering,Bathurst,NSW,Australia"],"affiliations":[{"raw_affiliation_string":"Charles Sturt University,School of Computing, Mathematics and Engineering,Bathurst,NSW,Australia","institution_ids":["https://openalex.org/I153230381"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018443733","display_name":"Tsz-Kwan Lee","orcid":"https://orcid.org/0000-0003-4176-2215"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Tsz-Kwan Lee","raw_affiliation_strings":["Deakin University,School of Information Technology,Burwood,Victoria,Australia"],"affiliations":[{"raw_affiliation_string":"Deakin University,School of Information Technology,Burwood,Victoria,Australia","institution_ids":["https://openalex.org/I149704539"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5126254447"],"corresponding_institution_ids":["https://openalex.org/I149704539"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.7418138,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"446","last_page":"451"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.436599999666214,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.436599999666214,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.42559999227523804,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12650","display_name":"Aesthetic Perception and Analysis","score":0.07490000128746033,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6930000185966492},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.6753000020980835},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6132000088691711},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5867000222206116},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5206999778747559},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.483599990606308},{"id":"https://openalex.org/keywords/monotonic-function","display_name":"Monotonic function","score":0.4278999865055084},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4244000017642975}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6930000185966492},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.6753000020980835},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6468999981880188},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6132000088691711},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6110000014305115},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5867000222206116},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5206999778747559},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.483599990606308},{"id":"https://openalex.org/C72169020","wikidata":"https://www.wikidata.org/wiki/Q194404","display_name":"Monotonic function","level":2,"score":0.4278999865055084},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4244000017642975},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.3603000044822693},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.3422999978065491},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.33899998664855957},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32850000262260437},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.310699999332428},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.31040000915527344},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3025999963283539},{"id":"https://openalex.org/C2776517306","wikidata":"https://www.wikidata.org/wiki/Q29017317","display_name":"Similarity measure","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C139489369","wikidata":"https://www.wikidata.org/wiki/Q770846","display_name":"Structural similarity","level":2,"score":0.28679999709129333},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.2818000018596649},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2775000035762787},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2689000070095062},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.267300009727478},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25589999556541443}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icipw68931.2025.11386242","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icipw68931.2025.11386242","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Image Processing Workshops (ICIPW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5149847269058228,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1580389772","https://openalex.org/W2133665775","https://openalex.org/W2768814045","https://openalex.org/W2962785568","https://openalex.org/W3153469116","https://openalex.org/W3159357947","https://openalex.org/W3217655095","https://openalex.org/W4312652102","https://openalex.org/W4312933868","https://openalex.org/W4316660205","https://openalex.org/W4385801729","https://openalex.org/W4390873054","https://openalex.org/W4391974577"],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"advancement":[2],"of":[3,28,136,198],"generative":[4,193],"AI":[5],"models":[6,24],"necessitates":[7],"novel":[8],"methods":[9],"for":[10,22,57,163,181,189],"evaluating":[11,192],"image":[12,66],"quality":[13],"that":[14,122],"extend":[15],"beyond":[16],"human":[17,88],"perception.":[18],"A":[19],"critical":[20],"concern":[21],"these":[23],"is":[25,55],"the":[26,38,44,109,132,196],"preservation":[27,125],"an":[29,186],"image's":[30],"underlying":[31],"Scene":[32],"Composition":[33],"Structure":[34],"(SCS),":[35],"which":[36],"defines":[37],"geometric":[39],"relationships":[40],"among":[41],"objects":[42],"and":[43,60,103,118,191],"background,":[45],"their":[46],"relative":[47],"positions,":[48],"sizes,":[49],"orientations,":[50],"etc.":[51],"Maintaining":[52],"SCS":[53,110,124,169],"integrity":[54,197],"paramount":[56],"ensuring":[58,195],"faithful":[59],"structurally":[61],"accurate":[62],"GenAI":[63],"outputs.":[64],"Traditional":[65],"similarity":[67],"metrics":[68,86,99],"often":[69],"fall":[70],"short":[71],"in":[72],"assessing":[73],"SCS.":[74,155],"Pixel-level":[75],"approaches":[76],"are":[77],"overly":[78],"sensitive":[79],"to":[80,149,174],"minor":[81],"visual":[82],"noise,":[83],"while":[84],"perception-based":[85],"prioritize":[87],"aesthetic":[89],"appeal,":[90],"neither":[91],"adequately":[92],"capturing":[93,139],"structural":[94,141,182],"fidelity.":[95],"Furthermore,":[96],"recent":[97],"neural-network-based":[98],"introduce":[100,108],"training":[101,119],"overheads":[102],"potential":[104],"generalization":[105],"issues.":[106],"We":[107],"Similarity":[111],"Index":[112],"Measure":[113],"(SCSSIM),":[114],"a":[115,159],"novel,":[116],"analytical,":[117],"free":[120],"metric":[121],"quantifies":[123],"by":[126],"exploiting":[127],"statistical":[128],"measures":[129],"derived":[130],"from":[131],"Cuboidal":[133],"hierarchical":[134],"partitioning":[135],"images,":[137],"robustly":[138],"non-object-based":[140],"relationships.":[142],"Our":[143],"experiments":[144],"demonstrate":[145],"SCSSIM's":[146],"high":[147],"invariance":[148],"non-compositional":[150],"distortions,":[151,165],"accurately":[152],"reflecting":[153],"unchanged":[154],"Conversely,":[156],"it":[157,185],"shows":[158],"strong":[160],"monotonic":[161],"decrease":[162],"compositional":[164],"precisely":[166],"indicating":[167],"when":[168],"has":[170],"been":[171],"altered.":[172],"Compared":[173],"existing":[175],"metrics,":[176],"SCSSIM":[177],"exhibits":[178],"superior":[179],"properties":[180],"evaluation,":[183],"making":[184],"invaluable":[187],"tool":[188],"developing":[190],"models,":[194],"scene":[199],"composition.":[200]},"counts_by_year":[],"updated_date":"2026-02-19T06:27:42.648592","created_date":"2026-02-18T00:00:00"}
