{"id":"https://openalex.org/W4416798770","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249403","title":"Neural Implicit Representations for Object-Centric Machine Vision Tasks","display_name":"Neural Implicit Representations for Object-Centric Machine Vision Tasks","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W4416798770","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249403"},"language":null,"primary_location":{"id":"doi:10.1109/apsipaasc65261.2025.11249403","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249403","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yeoneui Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I138925566","display_name":"Ewha Womans University","ror":"https://ror.org/053fp5c05","country_code":"KR","type":"education","lineage":["https://openalex.org/I138925566"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Yeoneui Kim","raw_affiliation_strings":["Ewha Womans University,Department of Electronic and Electrical Engineering,South Korea"],"affiliations":[{"raw_affiliation_string":"Ewha Womans University,Department of Electronic and Electrical Engineering,South Korea","institution_ids":["https://openalex.org/I138925566"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039192390","display_name":"Je\u2010Won Kang","orcid":"https://orcid.org/0000-0002-1637-9479"},"institutions":[{"id":"https://openalex.org/I138925566","display_name":"Ewha Womans University","ror":"https://ror.org/053fp5c05","country_code":"KR","type":"education","lineage":["https://openalex.org/I138925566"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Je-Won Kang","raw_affiliation_strings":["Ewha Womans University,Department of Electronic and Electrical Engineering,South Korea"],"affiliations":[{"raw_affiliation_string":"Ewha Womans University,Department of Electronic and Electrical Engineering,South Korea","institution_ids":["https://openalex.org/I138925566"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I138925566"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.36616185,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2442","last_page":"2447"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.27129998803138733,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.27129998803138733,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.20020000636577606,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.08980000019073486,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/codec","display_name":"Codec","score":0.598800003528595},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5515000224113464},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.5095000267028809},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.4228000044822693},{"id":"https://openalex.org/keywords/machine-vision","display_name":"Machine vision","score":0.3977000117301941},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.3953999876976013},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.3944999873638153},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.3686999976634979}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.817300021648407},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6140000224113464},{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.598800003528595},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5515000224113464},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.5095000267028809},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45570001006126404},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4546999931335449},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.4228000044822693},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.3977000117301941},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.3953999876976013},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3944999873638153},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.3686999976634979},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3671000003814697},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.33629998564720154},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.33570000529289246},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.31859999895095825},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C146047270","wikidata":"https://www.wikidata.org/wiki/Q469666","display_name":"Human\u2013machine system","level":2,"score":0.25529998540878296},{"id":"https://openalex.org/C153338461","wikidata":"https://www.wikidata.org/wiki/Q2651","display_name":"Arithmetic coding","level":4,"score":0.25519999861717224},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.2549999952316284},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc65261.2025.11249403","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249403","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1647613411","display_name":null,"funder_award_id":"IITP-2025-RS-2020-II201460","funder_id":"https://openalex.org/F4320324891","funder_display_name":"Iran Telecommunication Research Center"}],"funders":[{"id":"https://openalex.org/F4320324891","display_name":"Iran Telecommunication Research Center","ror":"https://ror.org/01a3g2z22"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2060108852","https://openalex.org/W2505609860","https://openalex.org/W3040479127","https://openalex.org/W3096609285","https://openalex.org/W3169367294","https://openalex.org/W3202918664","https://openalex.org/W3204647170","https://openalex.org/W4312493191","https://openalex.org/W4376130027","https://openalex.org/W4386065618","https://openalex.org/W4386076325","https://openalex.org/W4390874575","https://openalex.org/W4391974577","https://openalex.org/W4402915458","https://openalex.org/W4404600503","https://openalex.org/W4404719129"],"related_works":[],"abstract_inverted_index":{"Video":[0],"Coding":[1],"for":[2,20,36,57,156],"Machines":[3],"(VCM)":[4],"has":[5],"become":[6],"increasingly":[7],"important":[8],"with":[9],"the":[10,17,74,136],"rapid":[11],"growth":[12],"of":[13],"video":[14,105],"data":[15],"and":[16,39,107,119,149],"rising":[18],"demand":[19],"machine":[21,58,108],"vision":[22,109],"systems":[23],"that":[24],"require":[25],"high":[26],"accuracy":[27,118,147],"under":[28],"low-bitrate":[29,137],"constraints.":[30],"Implicit":[31],"Neural":[32],"Representations":[33],"(INRs),":[34],"known":[35],"their":[37],"compactness":[38],"strong":[40],"compression":[41,106],"ability,":[42],"offer":[43],"a":[44,52,84],"promising":[45],"direction.":[46],"In":[47],"this":[48],"paper,":[49],"we":[50],"propose":[51],"novel":[53],"INR":[54,62,101],"framework":[55],"tailored":[56],"vision.":[59],"Unlike":[60],"prior":[61],"methods":[63],"focused":[64],"on":[65,88],"human":[66],"perception,":[67],"our":[68],"model":[69],"embeds":[70],"object-aware":[71,93],"information":[72],"into":[73],"neural":[75],"network.":[76],"Specifically,":[77],"decoder":[78],"weights":[79],"are":[80],"dynamically":[81],"generated":[82],"using":[83],"dynamic":[85],"network":[86],"conditioned":[87],"object-centric":[89],"latent":[90],"codes,":[91],"enabling":[92],"reconstruction.":[94],"Experiments":[95],"show":[96],"consistent":[97],"improvements":[98],"across":[99],"various":[100],"baselines":[102],"in":[103,124,135],"both":[104],"tasks.":[110],"Our":[111],"method":[112],"achieves":[113],"up":[114],"to":[115,128],"6%":[116,146],"higher":[117],"over":[120,145],"60%":[121],"bitrate":[122,151],"reduction":[123],"object":[125],"detection":[126],"compared":[127],"baselines,":[129],"even":[130],"outperforming":[131],"recent":[132],"standard":[133],"codecs":[134],"regime.":[138],"For":[139],"semantic":[140],"segmentation,":[141],"it":[142],"also":[143],"yields":[144],"gains":[148],"notable":[150],"savings,":[152],"demonstrating":[153],"its":[154],"effectiveness":[155],"VCM.":[157]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-11-28T00:00:00"}
