{"id":"https://openalex.org/W4405785168","doi":"https://doi.org/10.1109/iros58592.2024.10801473","title":"MARVIS: Motion &amp; Geometry Aware Real and Virtual Image Segmentation","display_name":"MARVIS: Motion &amp; Geometry Aware Real and Virtual Image Segmentation","publication_year":2024,"publication_date":"2024-10-14","ids":{"openalex":"https://openalex.org/W4405785168","doi":"https://doi.org/10.1109/iros58592.2024.10801473"},"language":"en","primary_location":{"id":"doi:10.1109/iros58592.2024.10801473","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801473","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5106236833","display_name":"Jiayi Wu","orcid":"https://orcid.org/0000-0001-9330-4836"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jiayi Wu","raw_affiliation_strings":["University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742"],"affiliations":[{"raw_affiliation_string":"University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101610451","display_name":"Xiaomin Lin","orcid":"https://orcid.org/0000-0002-9764-5168"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaomin Lin","raw_affiliation_strings":["University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742"],"affiliations":[{"raw_affiliation_string":"University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090868495","display_name":"S. Negahdaripour","orcid":"https://orcid.org/0000-0001-5676-5238"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shahriar Negahdaripour","raw_affiliation_strings":["University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742"],"affiliations":[{"raw_affiliation_string":"University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083553427","display_name":"Cornelia Ferm\u00fcller","orcid":"https://orcid.org/0000-0003-2044-2386"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Cornelia Ferm\u00fcller","raw_affiliation_strings":["University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742"],"affiliations":[{"raw_affiliation_string":"University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036912867","display_name":"Yiannis Aloimonos","orcid":"https://orcid.org/0000-0002-8152-4281"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiannis Aloimonos","raw_affiliation_strings":["University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742"],"affiliations":[{"raw_affiliation_string":"University of Maryland,Maryland Robotics Center (MRC),College Park,MD,USA,20742","institution_ids":["https://openalex.org/I66946132"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5106236833"],"corresponding_institution_ids":["https://openalex.org/I66946132"],"apc_list":null,"apc_paid":null,"fwci":0.5263,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.68585735,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2778","last_page":"2785"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9915000200271606,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9915000200271606,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9828000068664551,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9818000197410583,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7303140759468079},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6484478712081909},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5985599160194397},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5943436622619629},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.5628888010978699},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5049536824226379},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4722541868686676},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4463443458080292},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.41434913873672485},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14738360047340393}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7303140759468079},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6484478712081909},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5985599160194397},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5943436622619629},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.5628888010978699},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5049536824226379},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4722541868686676},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4463443458080292},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.41434913873672485},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14738360047340393}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros58592.2024.10801473","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801473","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1901129140","https://openalex.org/W2145451994","https://openalex.org/W2194775991","https://openalex.org/W2560023338","https://openalex.org/W2563150812","https://openalex.org/W2565639579","https://openalex.org/W2609883120","https://openalex.org/W2615547864","https://openalex.org/W2734349601","https://openalex.org/W2884585870","https://openalex.org/W2949223310","https://openalex.org/W3012984837","https://openalex.org/W3109908659","https://openalex.org/W3132455321","https://openalex.org/W3173433277","https://openalex.org/W3181199966","https://openalex.org/W3195589214","https://openalex.org/W3205562993","https://openalex.org/W3207717858","https://openalex.org/W3208145569","https://openalex.org/W4285102565","https://openalex.org/W4295934721","https://openalex.org/W4312121413","https://openalex.org/W4312364246","https://openalex.org/W4312814074","https://openalex.org/W4319336200","https://openalex.org/W4367839311","https://openalex.org/W4382397550","https://openalex.org/W4383109003","https://openalex.org/W4383109082","https://openalex.org/W4385485159","https://openalex.org/W4389543830","https://openalex.org/W4389543970","https://openalex.org/W4391422864","https://openalex.org/W6739696289","https://openalex.org/W6751420435","https://openalex.org/W6751733626","https://openalex.org/W6755437240","https://openalex.org/W6755977528","https://openalex.org/W6757817989","https://openalex.org/W6766978945","https://openalex.org/W7046211814"],"related_works":["https://openalex.org/W4379231730","https://openalex.org/W4389858081","https://openalex.org/W2501551404","https://openalex.org/W4298131179","https://openalex.org/W2113201962","https://openalex.org/W4385583601","https://openalex.org/W4395685956","https://openalex.org/W3159516372","https://openalex.org/W4398146871","https://openalex.org/W1522196789"],"abstract_inverted_index":{"Tasks":[0],"such":[1],"as":[2],"autonomous":[3],"navigation,":[4],"3D":[5],"reconstruction,":[6],"and":[7,30,40,51,63,112,127,158,188,198,220,250],"object":[8],"recognition":[9],"near":[10],"the":[11,33,80,91,141,149,159,169,172],"water":[12,173],"surfaces":[13],"are":[14,252],"crucial":[15],"in":[16,49,153,210],"marine":[17],"robotics":[18],"applications.":[19],"However,":[20],"challenges":[21],"arise":[22],"due":[23],"to":[24,46,59,137,184],"dynamic":[25],"disturbances,":[26],"e.g.,":[27],"light":[28,83],"reflections":[29],"refraction":[31],"from":[32],"random":[34],"air-water":[35],"interface,":[36],"irregular":[37],"liquid":[38],"flow,":[39],"similar":[41],"factors,":[42],"which":[43],"can":[44],"lead":[45],"potential":[47],"failures":[48],"perception":[50],"navigation":[52],"systems.":[53],"Traditional":[54],"computer":[55],"vision":[56],"algorithms":[57],"struggle":[58],"differentiate":[60],"between":[61,186],"real":[62,111,160,187,212],"virtual":[64,71,113,189],"image":[65,72,114,207],"regions,":[66,115],"significantly":[67],"complicating":[68],"tasks.":[69],"A":[70],"region":[73],"is":[74],"an":[75,94,216],"apparent":[76],"representation":[77],"formed":[78],"by":[79,147],"redirection":[81],"of":[82,93,171],"rays,":[84],"typically":[85],"through":[86,199],"reflection":[87],"or":[88],"refraction,":[89],"creating":[90,163],"illusion":[92],"object\u2019s":[95],"presence":[96],"without":[97],"its":[98],"actual":[99],"physical":[100],"location.":[101],"This":[102],"work":[103],"proposes":[104],"a":[105,123,221,229,243],"novel":[106],"approach":[107],"for":[108,180],"segmentation":[109,132,151,208],"on":[110,242],"exploiting":[116],"synthetic":[117,165],"images":[118,166,190],"combined":[119],"with":[120],"domain-invariant":[121],"information,":[122],"Motion":[124],"Entropy":[125],"Kernel,":[126],"Epipolar":[128],"Geometric":[129],"Consistency.":[130],"Our":[131,248],"network":[133,152,182],"does":[134],"not":[135],"need":[136],"be":[138],"re-trained":[139],"if":[140],"domain":[142],"changes.":[143],"We":[144],"show":[145],"this":[146],"deploying":[148],"same":[150],"two":[154],"different":[155],"domains:":[156],"simulation":[157],"world.":[161],"By":[162,192],"realistic":[164],"that":[167],"mimic":[168],"complexities":[170],"surface,":[174],"we":[175,203],"provide":[176],"fine-grained":[177],"training":[178],"data":[179],"our":[181],"(MARVIS)":[183],"discern":[185],"effectively.":[191],"motion":[193],"&":[194],"geometry-aware":[195],"design":[196],"choices":[197],"comprehensive":[200],"experimental":[201],"analysis,":[202],"achieve":[204],"state-of-the-art":[205],"real-virtual":[206],"performance":[209],"unseen":[211],"world":[213],"domain,":[214],"achieving":[215],"IoU":[217],"over":[218,225,235],"78%":[219],"F<inf":[222],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[223],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</inf>-Score":[224],"86%":[226],"while":[227],"ensuring":[228],"small":[230],"computational":[231],"footprint.":[232],"MARVIS":[233],"offers":[234],"43":[236],"FPS":[237],"(8":[238],"FPS)":[239],"inference":[240],"rates":[241],"single":[244],"GPU":[245],"(CPU":[246],"core).":[247],"code":[249],"dataset":[251],"available":[253],"here":[254],"https://github.com/jiayi-wu-umd/MARVIS.":[255]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
