{"id":"https://openalex.org/W7129579952","doi":"https://doi.org/10.1109/icipw68931.2025.11386259","title":"Scalable Human-Machine Image Coding Using Latent Space Triple Masking","display_name":"Scalable Human-Machine Image Coding Using Latent Space Triple Masking","publication_year":2025,"publication_date":"2025-09-14","ids":{"openalex":"https://openalex.org/W7129579952","doi":"https://doi.org/10.1109/icipw68931.2025.11386259"},"language":null,"primary_location":{"id":"doi:10.1109/icipw68931.2025.11386259","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icipw68931.2025.11386259","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Image Processing Workshops (ICIPW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068917647","display_name":"Haoyun Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haoyun Cheng","raw_affiliation_strings":["University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029680806","display_name":"Hanyue Tu","orcid":"https://orcid.org/0000-0003-3705-1197"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanyue Tu","raw_affiliation_strings":["University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126176419","display_name":"Li Li","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Li","raw_affiliation_strings":["University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126221147","display_name":"Feng Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Wu","raw_affiliation_strings":["University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5068917647"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.75450129,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"574","last_page":"579"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.6672999858856201,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.6672999858856201,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.08649999648332596,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.03669999912381172,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5353000164031982},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.48649999499320984},{"id":"https://openalex.org/keywords/human-visual-system-model","display_name":"Human visual system model","score":0.47450000047683716},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.4595000147819519},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41339999437332153},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.3889999985694885},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.3824000060558319},{"id":"https://openalex.org/keywords/visual-masking","display_name":"Visual masking","score":0.3732999861240387}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7365999817848206},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5353000164031982},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4964999854564667},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.48649999499320984},{"id":"https://openalex.org/C160086991","wikidata":"https://www.wikidata.org/wiki/Q5939193","display_name":"Human visual system model","level":3,"score":0.47450000047683716},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.4595000147819519},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41339999437332153},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.3889999985694885},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.3824000060558319},{"id":"https://openalex.org/C2779200073","wikidata":"https://www.wikidata.org/wiki/Q18395575","display_name":"Visual masking","level":4,"score":0.3732999861240387},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3456999957561493},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.3377000093460083},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.32260000705718994},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.31779998540878296},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.3107999861240387},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3046000003814697},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3025999963283539},{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.30079999566078186},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.2694000005722046},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25929999351501465},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.25369998812675476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icipw68931.2025.11386259","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icipw68931.2025.11386259","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Image Processing Workshops (ICIPW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2962785568","https://openalex.org/W2981613960","https://openalex.org/W3034469748","https://openalex.org/W3138516171","https://openalex.org/W3186910762","https://openalex.org/W3209814877","https://openalex.org/W4284691924","https://openalex.org/W4312806968","https://openalex.org/W4386075611","https://openalex.org/W4387967955","https://openalex.org/W4403841811"],"related_works":[],"abstract_inverted_index":{"Most":[0],"existing":[1],"scalable":[2,54],"human-machine":[3,55],"image":[4,56],"coding":[5,57],"methods":[6,25],"are":[7],"optimized":[8],"for":[9,113,117,167],"pixel-wise":[10],"mean":[11],"squared":[12],"error,":[13],"which":[14,42],"do":[15],"not":[16,44],"accurately":[17],"represent":[18],"the":[19,29,91,103,127,157],"human":[20,76,168],"visual":[21,77],"system.":[22],"Besides,":[23],"these":[24,49],"typically":[26],"assume":[27],"that":[28,38,146],"information":[30,92],"required":[31,93],"by":[32,40,94,123],"machines":[33,95],"is":[34,43],"a":[35,53,82],"subset":[36],"of":[37],"needed":[39],"humans,":[41],"theoretically":[45],"guaranteed.":[46],"To":[47],"address":[48],"limitations,":[50],"we":[51,68,80,101],"propose":[52],"framework":[58],"with":[59,75,154],"latent":[60,104],"space":[61,105],"triple":[62,129],"masking":[63,130],"in":[64],"this":[65],"paper.":[66],"First,":[67],"utilize":[69],"perceptual":[70,165],"metrics":[71],"to":[72,137],"better":[73],"align":[74],"perception.":[78],"Then":[79],"adopt":[81],"more":[83],"universal":[84],"assumption:":[85],"there":[86],"exists":[87],"an":[88],"intersection":[89],"between":[90],"and":[96,120,141],"humans.":[97],"Based":[98],"on":[99],"this,":[100],"partition":[102],"into":[106,132],"three":[107,110],"parts":[108],"using":[109],"masks:":[111],"one":[112,116,121],"human-specific":[114],"information,":[115,119],"machine-specific":[118],"shared":[122],"both.":[124],"We":[125],"integrate":[126],"proposed":[128],"mechanism":[131],"two":[133],"representative":[134],"compression":[135],"models":[136],"validate":[138],"its":[139],"effectiveness":[140],"generality.":[142],"Experimental":[143],"results":[144],"demonstrate":[145],"our":[147],"method":[148],"achieves":[149],"significant":[150],"bitrate":[151],"savings":[152],"compared":[153],"benchmarks":[155],"under":[156],"same":[158],"machine":[159],"analysis":[160],"accuracy,":[161],"while":[162],"maintaining":[163],"high":[164],"quality":[166],"vision.":[169]},"counts_by_year":[],"updated_date":"2026-02-23T20:09:44.859080","created_date":"2026-02-18T00:00:00"}
