{"id":"https://openalex.org/W4308627439","doi":"https://doi.org/10.1145/3549037.3570195","title":"Data quality and model under-specification issues (keynote)","display_name":"Data quality and model under-specification issues (keynote)","publication_year":2022,"publication_date":"2022-11-07","ids":{"openalex":"https://openalex.org/W4308627439","doi":"https://doi.org/10.1145/3549037.3570195"},"language":"en","primary_location":{"id":"doi:10.1145/3549037.3570195","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3549037.3570195","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Workshop on Software Engineering and AI for Data Quality in Cyber-Physical Systems/Internet of Things","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040665094","display_name":"Foutse Khomh","orcid":null},"institutions":[{"id":"https://openalex.org/I45683168","display_name":"Polytechnique Montr\u00e9al","ror":"https://ror.org/05f8d4e86","country_code":"CA","type":"education","lineage":["https://openalex.org/I45683168"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Foutse Khomh","raw_affiliation_strings":["Polytechnique Montr\u00e9al, Canada"],"affiliations":[{"raw_affiliation_string":"Polytechnique Montr\u00e9al, Canada","institution_ids":["https://openalex.org/I45683168"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5040665094"],"corresponding_institution_ids":["https://openalex.org/I45683168"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11416715,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2","last_page":"2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7575781345367432},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6896002292633057},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6285960078239441},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6027539372444153},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.5584415197372437},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.5387289524078369},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5023162364959717},{"id":"https://openalex.org/keywords/root-cause","display_name":"Root cause","score":0.4747909903526306},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.37902793288230896},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3668307065963745},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.333313524723053},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15176475048065186},{"id":"https://openalex.org/keywords/reliability-engineering","display_name":"Reliability engineering","score":0.13937535881996155},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10530966520309448},{"id":"https://openalex.org/keywords/operations-management","display_name":"Operations management","score":0.10104450583457947}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7575781345367432},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6896002292633057},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6285960078239441},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6027539372444153},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.5584415197372437},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.5387289524078369},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5023162364959717},{"id":"https://openalex.org/C84945661","wikidata":"https://www.wikidata.org/wiki/Q7366567","display_name":"Root cause","level":2,"score":0.4747909903526306},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.37902793288230896},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3668307065963745},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.333313524723053},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15176475048065186},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.13937535881996155},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10530966520309448},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.10104450583457947},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3549037.3570195","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3549037.3570195","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Workshop on Software Engineering and AI for Data Quality in Cyber-Physical Systems/Internet of Things","raw_type":"proceedings-article"},{"id":"pmh:oai:publications.polymtl.ca:56839","is_oa":false,"landing_page_url":"https://publications.polymtl.ca/56839/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401013","display_name":"PolyPublie (\u00c9cole Polytechnique de Montr\u00e9al)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45683168","host_organization_name":"Polytechnique Montr\u00e9al","host_organization_lineage":["https://openalex.org/I45683168"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Communication de conf\u00e9rence"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3037187668","https://openalex.org/W4234772502","https://openalex.org/W2380685755","https://openalex.org/W2252100032","https://openalex.org/W2963436428","https://openalex.org/W3081133439","https://openalex.org/W4386246791","https://openalex.org/W3211701140","https://openalex.org/W2952280724","https://openalex.org/W2133103607"],"abstract_inverted_index":{"Nowadays,":[0],"we":[1,84,106],"are":[2],"witnessing":[3],"an":[4],"increasing":[5],"demand":[6],"in":[7,59],"both":[8],"industry":[9],"and":[10,35,51,103],"academia":[11],"for":[12,94],"exploiting":[13],"Deep":[14],"Learning":[15],"(DL)":[16],"to":[17,87,109],"solve":[18],"complex":[19],"real-world":[20],"problems.":[21],"However,":[22],"the":[23,33,52,112],"performance":[24],"of":[25,37,44,54,91,115],"these":[26],"high-capacity":[27],"learners":[28],"is":[29],"currently":[30],"bounded":[31],"by":[32],"quality":[34],"volume":[36],"their":[38],"underlying":[39],"training":[40,49,61,124],"data.":[41],"The":[42],"use":[43],"incomplete,":[45],"erroneous,":[46],"or":[47,68],"inappropriate":[48],"data,":[50],"implementation":[53],"poor":[55],"data":[56,92],"management":[57,93],"practices":[58,90],"a":[60,122],"pipeline":[62],"often":[63],"result":[64],"into":[65],"unreliable,":[66],"biased,":[67],"under":[69],"specified":[70],"models.":[71],"In":[72],"this":[73],"talk,":[74],"I":[75,96],"will":[76,97],"report":[77,99],"about":[78,100],"some":[79],"recent":[80,101],"research":[81],"works":[82],"that":[83,105],"have":[85,107],"conducted":[86],"identify":[88],"best":[89],"DL.":[95],"also":[98],"techniques":[102],"tools":[104],"developed":[108],"help":[110],"detect":[111],"root":[113],"cause":[114],"model":[116],"under-specification":[117],"issues":[118],"early":[119],"on":[120],"during":[121],"DL":[123],"process.":[125]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
