{"id":"https://openalex.org/W2965293215","doi":"https://doi.org/10.1109/wacv45572.2020.9093449","title":"Quadtree Generating Networks: Efficient Hierarchical Scene Parsing with Sparse Convolutions","display_name":"Quadtree Generating Networks: Efficient Hierarchical Scene Parsing with Sparse Convolutions","publication_year":2020,"publication_date":"2020-03-01","ids":{"openalex":"https://openalex.org/W2965293215","doi":"https://doi.org/10.1109/wacv45572.2020.9093449","mag":"2965293215"},"language":"en","primary_location":{"id":"doi:10.1109/wacv45572.2020.9093449","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv45572.2020.9093449","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1907.11821","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041189908","display_name":"Kashyap Chitta","orcid":"https://orcid.org/0000-0002-3891-3230"},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"funder","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I8087733","display_name":"University of T\u00fcbingen","ror":"https://ror.org/03a1kwz48","country_code":"DE","type":"education","lineage":["https://openalex.org/I8087733"]},{"id":"https://openalex.org/I4210135521","display_name":"Max Planck Institute for Intelligent Systems","ror":"https://ror.org/04fq9j139","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210135521"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Kashyap Chitta","raw_affiliation_strings":["Autonomous Vision Group, MPI for Intelligent Systems and University of T\u00fcbingen","Max-Planck-Society"],"affiliations":[{"raw_affiliation_string":"Autonomous Vision Group, MPI for Intelligent Systems and University of T\u00fcbingen","institution_ids":["https://openalex.org/I4210135521","https://openalex.org/I8087733"]},{"raw_affiliation_string":"Max-Planck-Society","institution_ids":["https://openalex.org/I149899117"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101540588","display_name":"Jos\u00e9 M. Alvarez","orcid":"https://orcid.org/0000-0002-7535-6322"},"institutions":[{"id":"https://openalex.org/I1304085615","display_name":"Nvidia (United Kingdom)","ror":"https://ror.org/02kr42612","country_code":"GB","type":"company","lineage":["https://openalex.org/I1304085615","https://openalex.org/I4210127875"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jose M. Alvarez","raw_affiliation_strings":["NVIDIA","nVidia"],"affiliations":[{"raw_affiliation_string":"NVIDIA","institution_ids":[]},{"raw_affiliation_string":"nVidia","institution_ids":["https://openalex.org/I1304085615"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075246991","display_name":"Martial Hebert","orcid":"https://orcid.org/0000-0003-4566-5930"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Martial Hebert","raw_affiliation_strings":["The Robotics Institute, Carnegie Mellon University","Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"The Robotics Institute, Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5041189908"],"corresponding_institution_ids":["https://openalex.org/I149899117","https://openalex.org/I4210135521","https://openalex.org/I8087733"],"apc_list":null,"apc_paid":null,"fwci":0.1963,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.46818801,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2009","last_page":"2018"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8088871240615845},{"id":"https://openalex.org/keywords/quadtree","display_name":"Quadtree","score":0.7535459995269775},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6692522764205933},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.6532759666442871},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6489508152008057},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6487895250320435},{"id":"https://openalex.org/keywords/memory-footprint","display_name":"Memory footprint","score":0.5676981210708618},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5640320777893066},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5357446074485779},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5287565588951111},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4576283097267151},{"id":"https://openalex.org/keywords/footprint","display_name":"Footprint","score":0.4165664613246918},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.41044309735298157},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3813176453113556}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8088871240615845},{"id":"https://openalex.org/C151416825","wikidata":"https://www.wikidata.org/wiki/Q934791","display_name":"Quadtree","level":2,"score":0.7535459995269775},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6692522764205933},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.6532759666442871},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6489508152008057},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6487895250320435},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.5676981210708618},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5640320777893066},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5357446074485779},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5287565588951111},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4576283097267151},{"id":"https://openalex.org/C132943942","wikidata":"https://www.wikidata.org/wiki/Q2562511","display_name":"Footprint","level":2,"score":0.4165664613246918},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.41044309735298157},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3813176453113556},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/wacv45572.2020.9093449","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv45572.2020.9093449","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1907.11821","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1907.11821","pdf_url":"https://arxiv.org/pdf/1907.11821","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.1907.11821","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1907.11821","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:2965293215","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1907.11821","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1907.11821","pdf_url":"https://arxiv.org/pdf/1907.11821","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.7200000286102295,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2965293215.pdf"},"referenced_works_count":71,"referenced_works":["https://openalex.org/W1745334888","https://openalex.org/W1901129140","https://openalex.org/W1903029394","https://openalex.org/W1923184257","https://openalex.org/W1948751323","https://openalex.org/W1968033505","https://openalex.org/W2022508996","https://openalex.org/W2027097582","https://openalex.org/W2050576295","https://openalex.org/W2095844239","https://openalex.org/W2101897555","https://openalex.org/W2118246710","https://openalex.org/W2129085190","https://openalex.org/W2131396337","https://openalex.org/W2194775991","https://openalex.org/W2322480645","https://openalex.org/W2340897893","https://openalex.org/W2507296351","https://openalex.org/W2514564637","https://openalex.org/W2556802233","https://openalex.org/W2556967412","https://openalex.org/W2560023338","https://openalex.org/W2563705555","https://openalex.org/W2603429625","https://openalex.org/W2630837129","https://openalex.org/W2737258237","https://openalex.org/W2738804062","https://openalex.org/W2762439315","https://openalex.org/W2780664485","https://openalex.org/W2805395174","https://openalex.org/W2853336868","https://openalex.org/W2884822772","https://openalex.org/W2892219791","https://openalex.org/W2894608628","https://openalex.org/W2895340641","https://openalex.org/W2951001719","https://openalex.org/W2963091558","https://openalex.org/W2963182550","https://openalex.org/W2963403868","https://openalex.org/W2963577694","https://openalex.org/W2963727650","https://openalex.org/W2963840672","https://openalex.org/W2963881378","https://openalex.org/W2963896595","https://openalex.org/W2964309882","https://openalex.org/W2981689412","https://openalex.org/W6637566013","https://openalex.org/W6637891497","https://openalex.org/W6639824700","https://openalex.org/W6674793120","https://openalex.org/W6677322329","https://openalex.org/W6679960548","https://openalex.org/W6696085341","https://openalex.org/W6700594562","https://openalex.org/W6724670942","https://openalex.org/W6726094665","https://openalex.org/W6729983426","https://openalex.org/W6739696289","https://openalex.org/W6739901393","https://openalex.org/W6741613197","https://openalex.org/W6745447533","https://openalex.org/W6746034047","https://openalex.org/W6748481559","https://openalex.org/W6751727959","https://openalex.org/W6752606552","https://openalex.org/W6752673784","https://openalex.org/W6753421600","https://openalex.org/W6754713557","https://openalex.org/W6754852571","https://openalex.org/W6754921469","https://openalex.org/W6756709046"],"related_works":["https://openalex.org/W3009389287","https://openalex.org/W3128896552","https://openalex.org/W3107163670","https://openalex.org/W2944192542","https://openalex.org/W3180799285","https://openalex.org/W2924464923","https://openalex.org/W3174280965","https://openalex.org/W3032400974","https://openalex.org/W2953366231","https://openalex.org/W3151565285","https://openalex.org/W3211110855","https://openalex.org/W2912996616","https://openalex.org/W3009950151","https://openalex.org/W2949394278","https://openalex.org/W3120248555","https://openalex.org/W3102039465","https://openalex.org/W3048074310","https://openalex.org/W2952263313","https://openalex.org/W3080745716","https://openalex.org/W2339675515"],"abstract_inverted_index":{"Semantic":[0],"segmentation":[1,44,59],"with":[2,76,152],"Convolutional":[3],"Neural":[4],"Networks":[5,29],"is":[6,49,179],"a":[7,31,97,149,159,166],"memory-intensive":[8],"task":[9],"due":[10],"to":[11,35,50,53,106,115,148,165],"the":[12,38,55,77,88,113,126,132],"high":[13],"spatial":[14],"resolution":[15],"of":[16,41,62,72,128],"feature":[17],"maps":[18],"and":[19,57,109,135,156],"output":[20],"predictions.":[21],"In":[22,94],"this":[23],"paper,":[24],"we":[25,140],"present":[26],"Quadtree":[27],"Generating":[28],"(QGNs),":[30],"novel":[32],"approach":[33,130],"able":[34],"drastically":[36],"reduce":[37],"memory":[39,154,172],"footprint":[40],"modern":[42],"semantic":[43],"networks.":[45],"The":[46],"key":[47],"idea":[48],"use":[51],"quadtrees":[52],"represent":[54],"predictions":[56],"target":[58],"masks":[60],"instead":[61],"dense":[63],"pixel":[64],"grids.":[65],"Our":[66,177],"quadtree":[67],"representation":[68,101],"enables":[69,102],"hierarchical":[70],"processing":[71],"an":[73,142],"input":[74],"image,":[75],"most":[78],"computationally":[79],"demanding":[80],"layers":[81],"only":[82,157],"being":[83],"used":[84],"at":[85,181],"regions":[86],"in":[87,117],"image":[89],"containing":[90],"boundaries":[91],"between":[92],"classes.":[93],"addition,":[95],"given":[96],"trained":[98],"model,":[99],"our":[100,129],"flexible":[103],"inference":[104],"schemes":[105],"trade-off":[107],"accuracy":[108],"computational":[110],"cost,":[111],"allowing":[112],"network":[114,151],"adapt":[116],"constrained":[118],"situations":[119],"such":[120],"as":[121],"embedded":[122],"devices.":[123],"We":[124],"demonstrate":[125],"benefits":[127],"on":[131],"Cityscapes,":[133,139],"SUN-RGBD":[134],"ADE20k":[136],"datasets.":[137],"On":[138],"obtain":[141],"relative":[143,161],"3%":[144,160],"mIoU":[145,162],"improvement":[146],"compared":[147,164],"dilated":[150,168],"similar":[153],"consumption;":[155],"receive":[158],"drop":[163],"large":[167],"network,":[169],"while":[170],"reducing":[171],"consumption":[173],"by":[174],"over":[175],"4\u00d7.":[176],"code":[178],"available":[180],"https://github.com/kashyap7x/QGN.":[182]},"counts_by_year":[{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
