{"id":"https://openalex.org/W2943248951","doi":"https://doi.org/10.1109/icpr48806.2021.9412945","title":"Improving Visual Relation Detection using Depth Maps","display_name":"Improving Visual Relation Detection using Depth Maps","publication_year":2021,"publication_date":"2021-01-10","ids":{"openalex":"https://openalex.org/W2943248951","doi":"https://doi.org/10.1109/icpr48806.2021.9412945","mag":"2943248951"},"language":"en","primary_location":{"id":"doi:10.1109/icpr48806.2021.9412945","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr48806.2021.9412945","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 25th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1905.00966","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039442998","display_name":"Sahand Sharifzadeh","orcid":null},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Sahand Sharifzadeh","raw_affiliation_strings":["Ludwig Maximilian University of Munich","Ludwig-Maximilian University of Munich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ludwig Maximilian University of Munich","institution_ids":["https://openalex.org/I8204097"]},{"raw_affiliation_string":"Ludwig-Maximilian University of Munich","institution_ids":["https://openalex.org/I8204097"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081679022","display_name":"Sina Moayed Baharlou","orcid":"https://orcid.org/0000-0003-0740-8570"},"institutions":[{"id":"https://openalex.org/I861853513","display_name":"Sapienza University of Rome","ror":"https://ror.org/02be6w209","country_code":"IT","type":"education","lineage":["https://openalex.org/I861853513"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Sina Moayed Baharlou","raw_affiliation_strings":["Sapienza University of Rome"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sapienza University of Rome","institution_ids":["https://openalex.org/I861853513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040144256","display_name":"Max Berrendorf","orcid":"https://orcid.org/0000-0001-9724-4009"},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Max Berrendorf","raw_affiliation_strings":["Ludwig Maximilian University of Munich","Ludwig-Maximilian University of Munich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ludwig Maximilian University of Munich","institution_ids":["https://openalex.org/I8204097"]},{"raw_affiliation_string":"Ludwig-Maximilian University of Munich","institution_ids":["https://openalex.org/I8204097"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047843370","display_name":"Rajat Koner","orcid":"https://orcid.org/0000-0003-3441-8192"},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Rajat Koner","raw_affiliation_strings":["Ludwig Maximilian University of Munich","Ludwig-Maximilian University of Munich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ludwig Maximilian University of Munich","institution_ids":["https://openalex.org/I8204097"]},{"raw_affiliation_string":"Ludwig-Maximilian University of Munich","institution_ids":["https://openalex.org/I8204097"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074808403","display_name":"Volker Tresp","orcid":"https://orcid.org/0000-0001-9428-3686"},"institutions":[{"id":"https://openalex.org/I1325886976","display_name":"Siemens (Germany)","ror":"https://ror.org/059mq0909","country_code":"DE","type":"company","lineage":["https://openalex.org/I1325886976"]},{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Volker Tresp","raw_affiliation_strings":["Ludwig Maximilian University of Munich &#x0026; Siemens AG","Ludwig Maximilian University of Munich & Siemens AG"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ludwig Maximilian University of Munich &#x0026; Siemens AG","institution_ids":["https://openalex.org/I1325886976","https://openalex.org/I8204097"]},{"raw_affiliation_string":"Ludwig Maximilian University of Munich & Siemens AG","institution_ids":["https://openalex.org/I1325886976","https://openalex.org/I8204097"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6792,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.69916614,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"3597","last_page":"3604"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spatial-relation","display_name":"Spatial relation","score":0.7582532167434692},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.7241514921188354},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.6698378324508667},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.6694141626358032},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6620357632637024},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6305474042892456},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6164612770080566},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.5781797766685486},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.567823588848114},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.537350058555603},{"id":"https://openalex.org/keywords/extension","display_name":"Extension (predicate logic)","score":0.532196044921875},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4972746670246124},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.481317400932312},{"id":"https://openalex.org/keywords/binary-relation","display_name":"Binary relation","score":0.4581647515296936},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.4196814000606537},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.39084291458129883},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3304857611656189},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2411176860332489},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.228569895029068}],"concepts":[{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.7582532167434692},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.7241514921188354},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.6698378324508667},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.6694141626358032},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6620357632637024},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6305474042892456},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6164612770080566},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.5781797766685486},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.567823588848114},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.537350058555603},{"id":"https://openalex.org/C2778029271","wikidata":"https://www.wikidata.org/wiki/Q5421931","display_name":"Extension (predicate logic)","level":2,"score":0.532196044921875},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4972746670246124},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.481317400932312},{"id":"https://openalex.org/C65180967","wikidata":"https://www.wikidata.org/wiki/Q130901","display_name":"Binary relation","level":2,"score":0.4581647515296936},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.4196814000606537},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.39084291458129883},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3304857611656189},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2411176860332489},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.228569895029068},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/icpr48806.2021.9412945","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr48806.2021.9412945","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 25th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1905.00966","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1905.00966","pdf_url":"https://arxiv.org/pdf/1905.00966","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2943248951","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/1905.00966","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1905.00966","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1905.00966","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1905.00966","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1905.00966","pdf_url":"https://arxiv.org/pdf/1905.00966","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5908723282","display_name":null,"funder_award_id":"01IS18050","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"}],"funders":[{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2943248951.pdf"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W125693051","https://openalex.org/W142212369","https://openalex.org/W205829674","https://openalex.org/W639708223","https://openalex.org/W1522301498","https://openalex.org/W1529533208","https://openalex.org/W1532325895","https://openalex.org/W1533230146","https://openalex.org/W1533861849","https://openalex.org/W1565402342","https://openalex.org/W1573897183","https://openalex.org/W1598866093","https://openalex.org/W1686810756","https://openalex.org/W2016753842","https://openalex.org/W2110917409","https://openalex.org/W2117539524","https://openalex.org/W2127426251","https://openalex.org/W2127795553","https://openalex.org/W2194775991","https://openalex.org/W2277195237","https://openalex.org/W2479423890","https://openalex.org/W2579549467","https://openalex.org/W2587989515","https://openalex.org/W2591644541","https://openalex.org/W2613718673","https://openalex.org/W2763058042","https://openalex.org/W2886970679","https://openalex.org/W2890814806","https://openalex.org/W2950133940","https://openalex.org/W2962737704","https://openalex.org/W2963432357","https://openalex.org/W2963536419","https://openalex.org/W2963591054","https://openalex.org/W2963956866","https://openalex.org/W3003588813","https://openalex.org/W3037161253","https://openalex.org/W3046075728","https://openalex.org/W6605121731","https://openalex.org/W6608344535","https://openalex.org/W6631943919","https://openalex.org/W6633727509","https://openalex.org/W6678830454","https://openalex.org/W6678846912","https://openalex.org/W6687483927","https://openalex.org/W6718112784","https://openalex.org/W6753998590"],"related_works":["https://openalex.org/W3162705930","https://openalex.org/W2591644541","https://openalex.org/W3212934559","https://openalex.org/W57867845","https://openalex.org/W3110034541","https://openalex.org/W3165215114","https://openalex.org/W597250640","https://openalex.org/W2503839561","https://openalex.org/W2806207967","https://openalex.org/W353806839","https://openalex.org/W2994893019","https://openalex.org/W2109584093","https://openalex.org/W2482549452","https://openalex.org/W2556366175","https://openalex.org/W2989664530","https://openalex.org/W1964874934","https://openalex.org/W2057753721","https://openalex.org/W2899414427","https://openalex.org/W2080938922","https://openalex.org/W2769252348"],"abstract_inverted_index":{"Visual":[0,91],"relation":[1,112,162],"detection":[2,113,163],"methods":[3],"rely":[4],"on":[5,33,70,139],"object":[6,34,65],"information":[7,32],"extracted":[8],"from":[9],"RGB":[10],"images":[11],"such":[12,44,52],"as":[13,45,53,87],"2D":[14],"bounding":[15],"boxes,":[16],"feature":[17],"maps,":[18,85],"and":[19,134],"predicted":[20],"class":[21],"probabilities.":[22],"We":[23,94],"argue":[24],"that":[25,97,145],"depth":[26,71,84,150],"maps":[27,151],"can":[28,164],"additionally":[29],"provide":[30],"valuable":[31],"relations,":[35,43,51],"e.g.":[36],"helping":[37],"to":[38,90,172],"detect":[39],"not":[40],"only":[41],"spatial":[42],"standing":[46],"behind,":[47],"but":[48],"also":[49,95],"non-spatial":[50],"holding.":[54],"In":[55],"this":[56,75,122],"work,":[57],"we":[58,77,124],"study":[59],"the":[60,99,158],"effect":[61],"of":[62,83,103,117,149,160,170],"using":[63,126],"different":[64],"features":[66],"with":[67],"a":[68,79,153,168],"focus":[69],"maps.":[72],"To":[73,120],"enable":[74],"study,":[76],"release":[78],"new":[80],"synthetic":[81],"dataset":[82],"VG-Depth,":[86],"an":[88,127],"extension":[89],"Genome":[92],"(VG).":[93],"note":[96],"given":[98],"highly":[100],"imbalanced":[101],"distribution":[102],"relations":[104],"in":[105],"VG,":[106],"typical":[107],"evaluation":[108],"metrics":[109],"for":[110],"visual":[111,161],"cannot":[114],"reveal":[115],"improvements":[116],"under-represented":[118],"relations.":[119],"address":[121],"problem,":[123],"propose":[125],"additional":[128],"metric,":[129],"calling":[130],"it":[131],"Macro":[132],"Recall@K,":[133],"demonstrate":[135],"its":[136],"remarkable":[137],"performance":[138,159],"VG.":[140],"Finally,":[141],"our":[142],"experiments":[143],"confirm":[144],"by":[146,167],"effective":[147],"utilization":[148],"within":[152],"simple,":[154],"yet":[155],"competitive":[156],"framework,":[157],"be":[165],"improved":[166],"margin":[169],"up":[171],"8%.":[173]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
