{"id":"https://openalex.org/W7117130991","doi":"https://doi.org/10.1109/jiot.2025.3648047","title":"Adaptive Collaborative DNN Inference via Heterogeneous Graph Attention in Edge Environments","display_name":"Adaptive Collaborative DNN Inference via Heterogeneous Graph Attention in Edge Environments","publication_year":2025,"publication_date":"2025-12-24","ids":{"openalex":"https://openalex.org/W7117130991","doi":"https://doi.org/10.1109/jiot.2025.3648047"},"language":null,"primary_location":{"id":"doi:10.1109/jiot.2025.3648047","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2025.3648047","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121181137","display_name":"Chuxuan Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chuxuan Shi","raw_affiliation_strings":["East-China Research Institute of Computer Technology, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0002-6257-5961","affiliations":[{"raw_affiliation_string":"East-China Research Institute of Computer Technology, Shanghai, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121239867","display_name":"Bo Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bo Jiang","raw_affiliation_strings":["East-China Research Institute of Computer Technology, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-0043-6256","affiliations":[{"raw_affiliation_string":"East-China Research Institute of Computer Technology, Shanghai, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121188926","display_name":"Hong Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hong Xu","raw_affiliation_strings":["East-China Research Institute of Computer Technology, Shanghai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"East-China Research Institute of Computer Technology, Shanghai, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121218948","display_name":"Jinhui Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jinhui Xie","raw_affiliation_strings":["East-China Research Institute of Computer Technology, Shanghai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"East-China Research Institute of Computer Technology, Shanghai, China","institution_ids":[]}]},{"author_position":"last","author":{"id":null,"display_name":"Chenglong Wang","orcid":"https://orcid.org/0009-0003-2555-9572"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chenglong Wang","raw_affiliation_strings":["East-China Research Institute of Computer Technology, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0003-2555-9572","affiliations":[{"raw_affiliation_string":"East-China Research Institute of Computer Technology, Shanghai, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5121181137"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.79908335,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":"5","first_page":"10017","last_page":"10034"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.5946000218391418,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.5946000218391418,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.13420000672340393,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.06239999830722809,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7886000275611877},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6001999974250793},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.44290000200271606},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4066999852657318},{"id":"https://openalex.org/keywords/approximate-inference","display_name":"Approximate inference","score":0.365200012922287},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.3573000133037567},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.34450000524520874},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3346000015735626}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.850600004196167},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7886000275611877},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6001999974250793},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46129998564720154},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.44290000200271606},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4066999852657318},{"id":"https://openalex.org/C2777472644","wikidata":"https://www.wikidata.org/wiki/Q16968992","display_name":"Approximate inference","level":3,"score":0.365200012922287},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.357699990272522},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.3573000133037567},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.34950000047683716},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34779998660087585},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.34450000524520874},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3346000015735626},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.3325999975204468},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.3131999969482422},{"id":"https://openalex.org/C107568181","wikidata":"https://www.wikidata.org/wiki/Q5319000","display_name":"Dynamic priority scheduling","level":3,"score":0.30799999833106995},{"id":"https://openalex.org/C55416958","wikidata":"https://www.wikidata.org/wiki/Q6206757","display_name":"Job shop scheduling","level":3,"score":0.298799991607666},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.2768999934196472},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2671999931335449},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.25760000944137573},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.25589999556541443}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jiot.2025.3648047","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2025.3648047","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.5031073093414307}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Deploying":[0],"deep":[1],"neural":[2],"networks":[3],"(DNNs)":[4],"in":[5,40,171],"dynamic":[6,28,93],"edge":[7,29,94,172],"environments":[8],"is":[9],"challenging,":[10],"as":[11],"scheduling":[12,65,127],"decisions":[13],"must":[14],"consider":[15],"both":[16],"the":[17,21,25,125,165],"topological":[18],"complexity":[19],"of":[20,27,167],"DNN":[22,89,169],"model":[23],"and":[24,92,148,161],"variability":[26],"resources.":[30],"Existing":[31],"methods":[32],"often":[33],"fail":[34],"to":[35,56,100,151,164],"balance":[36],"this":[37,44],"trade-off,":[38],"resulting":[39],"suboptimal":[41],"performance.":[42],"In":[43],"study,":[45],"we":[46],"introduce":[47],"Heterogeneous":[48],"Graph-Attention-Network-Based":[49],"Collaborative":[50],"Inference":[51],"(HANCI),":[52],"a":[53,70,77,109,115,120,159],"framework":[54,68],"designed":[55],"minimize":[57],"end-to-end":[58],"inference":[59,141,170],"latency":[60,142],"using":[61],"an":[62],"intelligent,":[63],"context-aware":[64],"approach.":[66],"This":[67,96,156],"employs":[69],"decoupled":[71],"feature":[72],"extraction":[73],"architecture":[74],"based":[75],"on":[76],"heterogeneous":[78],"graph":[79],"attention":[80],"network.":[81],"It":[82,139],"independently":[83],"extracts":[84],"high-quality":[85],"features":[86],"from":[87],"static":[88],"computational":[90],"graphs":[91],"environments.":[95,173],"decoupling":[97],"allows":[98],"HANCI":[99,134],"generate":[101],"comprehensive,":[102],"interference-free":[103],"state":[104],"embeddings.":[105],"These":[106],"embeddings":[107],"support":[108],"hybrid":[110],"decision-making":[111],"strategy":[112],"that":[113,133],"combines":[114],"learned":[116],"partitioning":[117],"policy":[118],"with":[119],"heuristic-guided":[121],"placement":[122],"mechanism,":[123],"making":[124],"complex":[126,154],"problem":[128],"tractable.":[129],"Experimental":[130],"evaluations":[131],"demonstrate":[132],"considerably":[135],"outperforms":[136],"baseline":[137],"methods.":[138],"reduces":[140],"by":[143,149],"21.6%":[144],"for":[145,153],"lightweight":[146],"models":[147],"up":[150],"78.1%":[152],"architectures.":[155],"study":[157],"provides":[158],"robust":[160],"adaptive":[162],"solution":[163],"challenge":[166],"collaborative":[168]},"counts_by_year":[],"updated_date":"2026-02-21T06:11:54.161237","created_date":"2025-12-24T00:00:00"}
