{"id":"https://openalex.org/W4376852236","doi":"https://doi.org/10.1145/3564121.3564137","title":"Unsupervised Early Exit in DNNs with Multiple Exits","display_name":"Unsupervised Early Exit in DNNs with Multiple Exits","publication_year":2022,"publication_date":"2022-10-12","ids":{"openalex":"https://openalex.org/W4376852236","doi":"https://doi.org/10.1145/3564121.3564137"},"language":"en","primary_location":{"id":"doi:10.1145/3564121.3564137","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3564121.3564137","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Second International Conference on AI-ML Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046451920","display_name":"Hari Narayan N U","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hari Narayan N U","raw_affiliation_strings":["MLiONS Lab, IEOR, IIT Bombay, IN"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"MLiONS Lab, IEOR, IIT Bombay, IN","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057858044","display_name":"Manjesh K. Hanawal","orcid":"https://orcid.org/0000-0002-1807-5487"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manjesh Kumar Hanawal","raw_affiliation_strings":["MLiONS Lab, IEOR, IIT Bombay, IN"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"MLiONS Lab, IEOR, IIT Bombay, IN","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063861809","display_name":"Avinash Bhardwaj","orcid":"https://orcid.org/0000-0002-9690-1705"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Avinash Bhardwaj","raw_affiliation_strings":["Mechanical Engineering, IIT Bombay, IN"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mechanical Engineering, IIT Bombay, IN","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.5069,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.70452799,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7527456283569336},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7356798648834229},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6534224152565002},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.5583535432815552},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5507661700248718},{"id":"https://openalex.org/keywords/differentiable-function","display_name":"Differentiable function","score":0.5010507106781006},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4582982659339905},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4563825726509094},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4505312442779541},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.44657179713249207},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4231884479522705},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3697112202644348},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14833080768585205}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7527456283569336},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7356798648834229},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6534224152565002},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.5583535432815552},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5507661700248718},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.5010507106781006},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4582982659339905},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4563825726509094},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4505312442779541},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.44657179713249207},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4231884479522705},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3697112202644348},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14833080768585205},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3564121.3564137","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3564121.3564137","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Second International Conference on AI-ML Systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1516184288","https://openalex.org/W1987292194","https://openalex.org/W2108278040","https://openalex.org/W2168405694","https://openalex.org/W2602856279","https://openalex.org/W2750779823","https://openalex.org/W2962677625","https://openalex.org/W2980856918","https://openalex.org/W2990958518","https://openalex.org/W3035038672","https://openalex.org/W3045789554","https://openalex.org/W3049640275","https://openalex.org/W3094307698","https://openalex.org/W3102767875","https://openalex.org/W3102775700","https://openalex.org/W3130607817","https://openalex.org/W3191795420","https://openalex.org/W3208262036","https://openalex.org/W4225966323"],"related_works":["https://openalex.org/W4285277090","https://openalex.org/W4327738859","https://openalex.org/W2348722996","https://openalex.org/W2334570605","https://openalex.org/W3181683615","https://openalex.org/W2898767136","https://openalex.org/W2981583398","https://openalex.org/W4379251913","https://openalex.org/W3042419602","https://openalex.org/W2966649771"],"abstract_inverted_index":{"Deep":[0],"Neural":[1],"Networks":[2],"(DNNs)":[3],"are":[4,180],"generally":[5],"designed":[6],"as":[7,206],"sequentially":[8],"cascaded":[9],"differentiable":[10],"blocks/layers":[11],"with":[12,26,132],"a":[13,55,188,230,286],"prediction":[14,27,57,77],"module":[15],"connected":[16],"only":[17],"to":[18,103,161,217,234,248,288],"its":[19],"last":[20,50],"layer.":[21],"DNNs":[22,179],"can":[23,37],"be":[24,115,126,196],"attached":[25],"modules":[28],"at":[29,39,121,166],"multiple":[30],"points":[31,294],"along":[32],"the":[33,47,90,94,108,118,133,137,163,172,201,214,219,227,240,250,259,279],"backbone":[34],"where":[35],"inference":[36],"stop":[38],"an":[40,141,150,207,254],"intermediary":[41],"stage":[42],"without":[43,257],"passing":[44],"through":[45],"all":[46],"modules.":[48],"The":[49,83],"exit":[51,68,85,123,139,168,204,221,252,293],"point":[52,69,86,124,169],"may":[53,87,97,113,194],"offer":[54],"better":[56,175],"error":[58,78,119,164],"but":[59],"also":[60],"involves":[61],"more":[62],"computational":[63],"resources":[64],"and":[65,79,96,117,170,212,305],"latency.":[66],"An":[67],"that":[70,155,236,273],"is":[71,81,130,159],"\u2018optimal\u2019":[72],"in":[73,140,149,183,253,295],"terms":[74],"of":[75,93,111,135,191,203],"both":[76],"cost":[80],"desirable.":[82],"optimal":[84,138,220,251,292],"depend":[88],"on":[89,226,303],"latent":[91],"distribution":[92],"tasks":[95],"change":[98],"from":[99],"one":[100,129],"task":[101],"type":[102],"another.":[104],"During":[105],"neural":[106],"inference,":[107],"ground":[109,192,260],"truth":[110,193,261],"instances":[112],"not":[114,195],"available":[116,160],"rates":[120],"each":[122,167],"cannot":[125],"estimated.":[127],"Hence":[128],"faced":[131],"problem":[134,148,202,211],"selecting":[136],"unsupervised":[142,208],"setting.":[143],"Prior":[144],"works":[145],"tackled":[146],"this":[147],"offline":[151],"supervised":[152],"setting":[153],"assuming":[154],"enough":[156],"labeled":[157],"data":[158],"estimate":[162],"rate":[165],"tune":[171],"parameters":[173],"for":[174,186],"accuracy.":[176],"However,":[177],"pre-trained":[178,231],"often":[181],"deployed":[182],"new":[184],"domains":[185],"which":[187],"large":[189],"amount":[190],"available.":[197],"We":[198,263,298],"thus":[199],"model":[200],"selection":[205],"online":[209,255],"learning":[210],"leverage":[213],"bandit":[215],"theory":[216],"identify":[218],"point.":[222],"Specifically,":[223],"we":[224],"focus":[225],"Elastic":[228],"BERT,":[229],"multi-exit":[232,296],"DNN":[233],"demonstrate":[235],"it":[237,246],"\u2018nearly\u2019":[238],"satisfies":[239],"Strong":[241],"Dominance":[242],"(SD)":[243],"property":[244],"making":[245],"possible":[247],"learn":[249,290],"setup":[256],"knowing":[258],"labels.":[262],"develop":[264],"upper":[265],"confidence":[266],"bound":[267],"(UCB)":[268],"based":[269],"algorithm":[270,302],"named":[271],"UEE-UCB":[272],"provably":[274],"achieves":[275],"sub-linear":[276],"regret":[277],"under":[278],"SD":[280],"property.":[281],"Thus":[282],"our":[283,301],"method":[284],"provides":[285],"means":[287],"adaptively":[289],"domain-specific":[291],"DNNs.":[297],"empirically":[299],"validate":[300],"IMDb":[304],"Yelp":[306],"datasets.":[307]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
