{"id":"https://openalex.org/W4404295200","doi":"https://doi.org/10.1109/mmsp61759.2024.10743493","title":"LAM3D: Leveraging Attention for Monocular 3D Object Detection","display_name":"LAM3D: Leveraging Attention for Monocular 3D Object Detection","publication_year":2024,"publication_date":"2024-10-02","ids":{"openalex":"https://openalex.org/W4404295200","doi":"https://doi.org/10.1109/mmsp61759.2024.10743493"},"language":"en","primary_location":{"id":"doi:10.1109/mmsp61759.2024.10743493","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/mmsp61759.2024.10743493","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 26th International Workshop on Multimedia Signal Processing (MMSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048403990","display_name":"Sas Diana Monica","orcid":"https://orcid.org/0009-0002-0735-0970"},"institutions":[{"id":"https://openalex.org/I158333966","display_name":"Technical University of Cluj-Napoca","ror":"https://ror.org/03r8nwp71","country_code":"RO","type":"education","lineage":["https://openalex.org/I158333966"]}],"countries":["RO"],"is_corresponding":true,"raw_author_name":"Diana-Alexandra Sas","raw_affiliation_strings":["Technical University of Cluj-Napoca,Faculty of Automation and Computer Science,Cluj-Napoca,Romania"],"affiliations":[{"raw_affiliation_string":"Technical University of Cluj-Napoca,Faculty of Automation and Computer Science,Cluj-Napoca,Romania","institution_ids":["https://openalex.org/I158333966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094101402","display_name":"Leandro Di Bella","orcid":"https://orcid.org/0009-0000-1731-7205"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Leandro Di Bella","raw_affiliation_strings":["Vrije Universiteit Brussel, ETRO,Brussels,Belgium"],"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, ETRO,Brussels,Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102878374","display_name":"Yangxintong Lyu","orcid":"https://orcid.org/0000-0002-2501-9010"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Yangxintong Lyu","raw_affiliation_strings":["Vrije Universiteit Brussel, ETRO,Brussels,Belgium"],"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, ETRO,Brussels,Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061493057","display_name":"Florin Oniga","orcid":"https://orcid.org/0000-0003-4875-2220"},"institutions":[{"id":"https://openalex.org/I158333966","display_name":"Technical University of Cluj-Napoca","ror":"https://ror.org/03r8nwp71","country_code":"RO","type":"education","lineage":["https://openalex.org/I158333966"]}],"countries":["RO"],"is_corresponding":false,"raw_author_name":"Florin Oniga","raw_affiliation_strings":["Technical University of Cluj-Napoca,Computer Science Department,Cluj-Napoca,Romania"],"affiliations":[{"raw_affiliation_string":"Technical University of Cluj-Napoca,Computer Science Department,Cluj-Napoca,Romania","institution_ids":["https://openalex.org/I158333966"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088598176","display_name":"Adrian Munteanu","orcid":"https://orcid.org/0000-0001-7290-0428"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Adrian Munteanu","raw_affiliation_strings":["Vrije Universiteit Brussel, ETRO,Brussels,Belgium"],"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, ETRO,Brussels,Belgium","institution_ids":["https://openalex.org/I13469542"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5048403990"],"corresponding_institution_ids":["https://openalex.org/I158333966"],"apc_list":null,"apc_paid":null,"fwci":0.2632,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.56260432,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9832000136375427,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9593999981880188,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7493977546691895},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6323449015617371},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.62364661693573},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.6178098917007446},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6010798215866089},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5266249775886536},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.2433088719844818}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7493977546691895},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6323449015617371},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.62364661693573},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.6178098917007446},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6010798215866089},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5266249775886536},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2433088719844818}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mmsp61759.2024.10743493","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/mmsp61759.2024.10743493","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 26th International Workshop on Multimedia Signal Processing (MMSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W2108598243","https://openalex.org/W2150066425","https://openalex.org/W2963037989","https://openalex.org/W2963150697","https://openalex.org/W2963323244","https://openalex.org/W2963351448","https://openalex.org/W2963893349","https://openalex.org/W2982238751","https://openalex.org/W2989676862","https://openalex.org/W3035424742","https://openalex.org/W3094502228","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3175515048","https://openalex.org/W3204439495","https://openalex.org/W4280496682","https://openalex.org/W4286285640","https://openalex.org/W4312349930","https://openalex.org/W4312865155","https://openalex.org/W4319300623","https://openalex.org/W4386075853","https://openalex.org/W4386453674","https://openalex.org/W4390873008","https://openalex.org/W4398810114","https://openalex.org/W6620707391","https://openalex.org/W6769209158","https://openalex.org/W6838393215","https://openalex.org/W6868582632"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Since":[0],"the":[1,4,8,11,18,28,46,53,83,105,109,116,119,123,134,144],"introduction":[2],"of":[3,10,25,118,136],"self-attention":[5],"mechanism":[6,48,74],"and":[7,40,99,127],"adoption":[9],"Transformer":[12,92],"architecture":[13,146],"for":[14,32,52,75],"Computer":[15],"Vision":[16,19,91],"tasks,":[17],"Transformer-based":[20],"architectures":[21],"gained":[22],"a":[23,69,89],"lot":[24],"popularity":[26],"in":[27,49,122],"field,":[29],"being":[30],"used":[31],"tasks":[33],"such":[34],"as":[35,95],"image":[36,41],"classification,":[37],"object":[38,78],"detection":[39,101],"segmentation.":[42],"However,":[43],"efficiently":[44],"leveraging":[45],"attention":[47],"vision":[50],"transformers":[51],"Monocular":[54,76],"3D":[55,77,111],"Object":[56,112],"Detection":[57,113],"task":[58],"remains":[59],"an":[60],"open":[61],"question.":[62],"In":[63],"this":[64],"paper,":[65],"we":[66],"present":[67],"LAM3D,":[68],"framework":[70],"that":[71,147],"Leverages":[72],"self-Attention":[73],"Detection.":[79],"To":[80],"do":[81],"so,":[82],"proposed":[84,106,120],"method":[85,107],"is":[86,139],"built":[87],"upon":[88],"Pyramid":[90],"v2":[93],"(PVTv2)":[94],"feature":[96],"extraction":[97],"backbone":[98],"2D/3D":[100],"machinery.":[102],"We":[103],"evaluate":[104],"on":[108],"KITTI":[110],"Benchmark,":[114],"proving":[115],"applicability":[117],"solution":[121],"autonomous":[124],"driving":[125],"domain":[126],"outperforming":[128],"reference":[129],"methods.":[130],"Moreover,":[131],"due":[132],"to":[133,141],"usage":[135],"self-attention,":[137],"LAM3D":[138],"able":[140],"systematically":[142],"outperform":[143],"equivalent":[145],"does":[148],"not":[149],"employ":[150],"self-attention.":[151]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
