{"id":"https://openalex.org/W4414539348","doi":"https://doi.org/10.23919/mva65244.2025.11175105","title":"Statistic Temporal Checking and Depth Layering based Multi-Object Relative Size Estimation from Monocular Video","display_name":"Statistic Temporal Checking and Depth Layering based Multi-Object Relative Size Estimation from Monocular Video","publication_year":2025,"publication_date":"2025-07-26","ids":{"openalex":"https://openalex.org/W4414539348","doi":"https://doi.org/10.23919/mva65244.2025.11175105"},"language":"en","primary_location":{"id":"doi:10.23919/mva65244.2025.11175105","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mva65244.2025.11175105","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 19th International Conference on Machine Vision and Applications (MVA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054514747","display_name":"Ziyue Wang","orcid":"https://orcid.org/0009-0001-1783-4816"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Ziyue Wang","raw_affiliation_strings":["Waseda University,Japan"],"affiliations":[{"raw_affiliation_string":"Waseda University,Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007867868","display_name":"Xina Cheng","orcid":"https://orcid.org/0000-0001-7319-1635"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xina Cheng","raw_affiliation_strings":["Xidian University,China"],"affiliations":[{"raw_affiliation_string":"Xidian University,China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079405967","display_name":"Takeshi Ikenaga","orcid":"https://orcid.org/0000-0001-9022-0813"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takeshi Ikenaga","raw_affiliation_strings":["Waseda University,Japan"],"affiliations":[{"raw_affiliation_string":"Waseda University,Japan","institution_ids":["https://openalex.org/I150744194"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5054514747"],"corresponding_institution_ids":["https://openalex.org/I150744194"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27711018,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.7530999779701233},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.6419000029563904},{"id":"https://openalex.org/keywords/layering","display_name":"Layering","score":0.6105999946594238},{"id":"https://openalex.org/keywords/statistic","display_name":"Statistic","score":0.5236999988555908},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4869000017642975},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4465000033378601},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.412200003862381}],"concepts":[{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.7530999779701233},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6827999949455261},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6621000170707703},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.6419000029563904},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6254000067710876},{"id":"https://openalex.org/C176055353","wikidata":"https://www.wikidata.org/wiki/Q1402114","display_name":"Layering","level":2,"score":0.6105999946594238},{"id":"https://openalex.org/C89128539","wikidata":"https://www.wikidata.org/wiki/Q1949963","display_name":"Statistic","level":2,"score":0.5236999988555908},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4869000017642975},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4465000033378601},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.412200003862381},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.37599998712539673},{"id":"https://openalex.org/C158829959","wikidata":"https://www.wikidata.org/wiki/Q1640606","display_name":"Monocular vision","level":2,"score":0.34850001335144043},{"id":"https://openalex.org/C761482","wikidata":"https://www.wikidata.org/wiki/Q118093","display_name":"Transmission (telecommunications)","level":2,"score":0.32670000195503235},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3215000033378601},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.26649999618530273},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.2630999982357025},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.262800008058548},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2614000141620636}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/mva65244.2025.11175105","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mva65244.2025.11175105","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 19th International Conference on Machine Vision and Applications (MVA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1505952289","https://openalex.org/W2519379752","https://openalex.org/W2887751724","https://openalex.org/W2938672559","https://openalex.org/W2962777203","https://openalex.org/W2963892972","https://openalex.org/W3020500358","https://openalex.org/W3034597466","https://openalex.org/W3194668692","https://openalex.org/W3199149066","https://openalex.org/W4321770087","https://openalex.org/W4393147877","https://openalex.org/W4396216689","https://openalex.org/W4402727359"],"related_works":[],"abstract_inverted_index":{"Knowing":[0],"the":[1,37,60,78,98,115,121,129,136],"relative":[2,79],"3D":[3,50,122],"size":[4,38,61,80],"of":[5,39,48,62,100,117],"multiple":[6,82],"objects":[7,41,64,118],"in":[8,65],"a":[9,15],"complex":[10],"indoor":[11],"environment":[12],"gradually":[13],"becomes":[14],"significant":[16],"topic":[17],"for":[18,31],"robotics,":[19],"smart":[20],"room,":[21],"and":[22,52,73,102,119,135],"signal":[23],"transmission":[24],"applications.":[25],"However,":[26],"it":[27],"is":[28,88,138,143],"still":[29],"challenging":[30],"existing":[32],"vision":[33],"systems":[34],"to":[35,46,76,90,113,140],"estimate":[36,77],"different":[40,63],"from":[42],"monocular":[43],"videos":[44],"due":[45],"lack":[47],"enough":[49],"information":[51],"limited":[53],"object":[54,94],"detection":[55],"accuracy.":[56,124],"To":[57],"accurately":[58],"judge":[59],"videos,":[66],"this":[67],"paper":[68],"proposes":[69],"statistic":[70,85],"temporal":[71,86],"checking":[72,87,97],"depth":[74,106,109],"layering":[75,107],"between":[81],"objects.":[83],"Firstly,":[84],"used":[89],"remove":[91],"outliers":[92],"around":[93,144],"region":[95],"by":[96],"probability":[99],"foreground":[101],"background":[103],"region.":[104],"Secondly,":[105],"provides":[108],"prior,":[110],"which":[111,142],"helps":[112],"enhance":[114],"boundary":[116],"increases":[120],"reconstruction":[123],"Extensive":[125],"experiments":[126],"demonstrate":[127],"that":[128],"proposed":[130],"method":[131],"achieves":[132],"0.7958":[133],"accuracy,":[134],"error":[137],"reduced":[139],"0.0635,":[141],"20%":[145],"improved":[146],"on":[147],"average.":[148]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
