{"id":"https://openalex.org/W4387360065","doi":"https://doi.org/10.1145/3609437.3609457","title":"Practical Accuracy Evaluation for Deep Learning Systems via Latent Representation Discrepancy","display_name":"Practical Accuracy Evaluation for Deep Learning Systems via Latent Representation Discrepancy","publication_year":2023,"publication_date":"2023-08-04","ids":{"openalex":"https://openalex.org/W4387360065","doi":"https://doi.org/10.1145/3609437.3609457"},"language":"en","primary_location":{"id":"doi:10.1145/3609437.3609457","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3609437.3609457","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th Asia-Pacific Symposium on Internetware","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057680987","display_name":"Yining Yin","orcid":"https://orcid.org/0009-0001-1574-2758"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yining Yin","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043981758","display_name":"Yang Feng","orcid":"https://orcid.org/0000-0002-7477-3642"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Feng","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101410200","display_name":"Zixi Liu","orcid":"https://orcid.org/0000-0002-3271-7255"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zixi Liu","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046549364","display_name":"Zhihong Zhao","orcid":"https://orcid.org/0009-0002-4629-6372"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhihong Zhao","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5057680987"],"corresponding_institution_ids":["https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12569129,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"205","last_page":"215"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.786526620388031},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.6943798065185547},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6630775332450867},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6158918142318726},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6126616597175598},{"id":"https://openalex.org/keywords/vulnerability","display_name":"Vulnerability (computing)","score":0.5373194813728333},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5062283873558044},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.48628246784210205},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4449147582054138},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4341084361076355},{"id":"https://openalex.org/keywords/test-data","display_name":"Test data","score":0.41351693868637085},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3651566505432129},{"id":"https://openalex.org/keywords/reliability-engineering","display_name":"Reliability engineering","score":0.34772396087646484},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.1411707103252411},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.109159916639328},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.07940691709518433}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.786526620388031},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.6943798065185547},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6630775332450867},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6158918142318726},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6126616597175598},{"id":"https://openalex.org/C95713431","wikidata":"https://www.wikidata.org/wiki/Q631425","display_name":"Vulnerability (computing)","level":2,"score":0.5373194813728333},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5062283873558044},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.48628246784210205},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4449147582054138},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4341084361076355},{"id":"https://openalex.org/C16910744","wikidata":"https://www.wikidata.org/wiki/Q7705759","display_name":"Test data","level":2,"score":0.41351693868637085},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3651566505432129},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.34772396087646484},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.1411707103252411},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.109159916639328},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.07940691709518433},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3609437.3609457","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3609437.3609457","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th Asia-Pacific Symposium on Internetware","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1987971958","https://openalex.org/W2124244761","https://openalex.org/W2139137304","https://openalex.org/W2616028256","https://openalex.org/W2799640043","https://openalex.org/W2804337238","https://openalex.org/W2888824816","https://openalex.org/W2948254043","https://openalex.org/W2954629067","https://openalex.org/W2954996726","https://openalex.org/W2957905354","https://openalex.org/W2995858837","https://openalex.org/W3000442532","https://openalex.org/W3009330671","https://openalex.org/W3041012898","https://openalex.org/W3042703469","https://openalex.org/W3090943961","https://openalex.org/W3105347387","https://openalex.org/W3124058431","https://openalex.org/W3125205424"],"related_works":["https://openalex.org/W4377865163","https://openalex.org/W3193857078","https://openalex.org/W2888956734","https://openalex.org/W4315865067","https://openalex.org/W2979433843","https://openalex.org/W3208304128","https://openalex.org/W3000197790","https://openalex.org/W209733029","https://openalex.org/W2891480213","https://openalex.org/W3118953353"],"abstract_inverted_index":{"As":[0],"deep":[1,28],"learning":[2,29],"systems":[3,39],"have":[4,16,54,78,100],"been":[5,101],"widely":[6],"deployed":[7],"in":[8,56,105],"many":[9],"safety-critical":[10],"scenarios,":[11],"their":[12,57],"quality":[13,22],"and":[14,23,49,74,87,133],"reliability":[15],"raised":[17],"growing":[18],"concerns.":[19],"Assuring":[20],"the":[21,25,68,82,85,107,115],"evaluating":[24],"accuracy":[26],"of":[27,44,84,117],"models":[30,53],"could":[31],"be":[32],"challenging":[33],"because,":[34],"unlike":[35],"traditional":[36],"software,":[37],"DL":[38,52,92,108],"rely":[40],"on":[41,60,81],"large":[42],"amounts":[43],"labeled":[45,118],"data":[46,124],"for":[47],"training":[48,73],"evaluation.":[50],"The":[51],"variability":[55],"behavioral":[58],"features":[59],"datasets":[61],"with":[62],"different":[63],"distributions.":[64],"In":[65],"practical":[66],"application,":[67],"potential":[69],"distribution":[70],"shift":[71],"between":[72],"usage":[75],"scenarios":[76,129],"may":[77],"an":[79],"impact":[80],"performance":[83],"model":[86],"bring":[88],"extra":[89],"vulnerability":[90],"to":[91,103],"systems.":[93],"Although":[94],"some":[95],"neuron":[96],"coverage":[97],"testing":[98,106],"criteria":[99],"proposed":[102],"assist":[104],"systems,":[109],"they":[110],"are":[111],"still":[112],"limited":[113],"by":[114],"amount":[116],"data.":[119],"Meanwhile,":[120],"manual":[121],"labeling":[122],"test":[123],"collected":[125],"from":[126],"real-world":[127],"application":[128],"is":[130],"very":[131],"time-consuming":[132],"costly.":[134]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
