{"id":"https://openalex.org/W3139497941","doi":"https://doi.org/10.1145/3448016.3457267","title":"MetaInsight: Automatic Discovery of Structured Knowledge for Exploratory Data Analysis","display_name":"MetaInsight: Automatic Discovery of Structured Knowledge for Exploratory Data Analysis","publication_year":2021,"publication_date":"2021-06-09","ids":{"openalex":"https://openalex.org/W3139497941","doi":"https://doi.org/10.1145/3448016.3457267","mag":"3139497941"},"language":"en","primary_location":{"id":"doi:10.1145/3448016.3457267","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448016.3457267","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Management of Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101728918","display_name":"Pingchuan Ma","orcid":"https://orcid.org/0000-0001-7680-2817"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Pingchuan Ma","raw_affiliation_strings":["Hong Kong University of Science and Technology, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102930678","display_name":"Rui Ding","orcid":"https://orcid.org/0000-0001-8342-7875"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Ding","raw_affiliation_strings":["Microsoft Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006300825","display_name":"Shi Han","orcid":"https://orcid.org/0000-0002-0360-6089"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shi Han","raw_affiliation_strings":["Microsoft Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100331488","display_name":"Dongmei Zhang","orcid":"https://orcid.org/0000-0002-9230-2799"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongmei Zhang","raw_affiliation_strings":["Microsoft Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101728918"],"corresponding_institution_ids":["https://openalex.org/I200769079"],"apc_list":null,"apc_paid":null,"fwci":6.8854,"has_fulltext":false,"cited_by_count":34,"citation_normalized_percentile":{"value":0.96854537,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1262","last_page":"1274"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.815019965171814},{"id":"https://openalex.org/keywords/knowledge-extraction","display_name":"Knowledge extraction","score":0.639145016670227},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5676358938217163},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.5523560047149658},{"id":"https://openalex.org/keywords/exploratory-data-analysis","display_name":"Exploratory data analysis","score":0.5063272714614868},{"id":"https://openalex.org/keywords/raw-data","display_name":"Raw data","score":0.4858929514884949},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4635773003101349},{"id":"https://openalex.org/keywords/exploratory-analysis","display_name":"Exploratory analysis","score":0.46272245049476624},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4447604715824127},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.44075414538383484},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4344896674156189},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4011506736278534},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35886526107788086},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.34062033891677856}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.815019965171814},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.639145016670227},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5676358938217163},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.5523560047149658},{"id":"https://openalex.org/C120894424","wikidata":"https://www.wikidata.org/wiki/Q1322871","display_name":"Exploratory data analysis","level":2,"score":0.5063272714614868},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.4858929514884949},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4635773003101349},{"id":"https://openalex.org/C3018260909","wikidata":"https://www.wikidata.org/wiki/Q1322871","display_name":"Exploratory analysis","level":2,"score":0.46272245049476624},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4447604715824127},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.44075414538383484},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4344896674156189},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4011506736278534},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35886526107788086},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.34062033891677856},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3448016.3457267","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448016.3457267","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Management of Data","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-111772","is_oa":false,"landing_page_url":"https://repository.hkust.edu.hk/ir/Record/1783.1-111772","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"},{"id":"pmh:oai:repository.ust.hk:1783.1-111772","is_oa":false,"landing_page_url":"http://repository.ust.hk/ir/Record/1783.1-111772","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W346507350","https://openalex.org/W1498726635","https://openalex.org/W1542115404","https://openalex.org/W1565838812","https://openalex.org/W1570418772","https://openalex.org/W1608294808","https://openalex.org/W1631295847","https://openalex.org/W1961845056","https://openalex.org/W1995887163","https://openalex.org/W2015599431","https://openalex.org/W2044240774","https://openalex.org/W2092103580","https://openalex.org/W2098247219","https://openalex.org/W2102297485","https://openalex.org/W2103201239","https://openalex.org/W2113411758","https://openalex.org/W2131920243","https://openalex.org/W2147931936","https://openalex.org/W2152228468","https://openalex.org/W2271163001","https://openalex.org/W2319794630","https://openalex.org/W2327620174","https://openalex.org/W2428096022","https://openalex.org/W2508656285","https://openalex.org/W2592469568","https://openalex.org/W2610226709","https://openalex.org/W2795226127","https://openalex.org/W2798990443","https://openalex.org/W2886887279","https://openalex.org/W2912779949","https://openalex.org/W2915786579","https://openalex.org/W2946535156","https://openalex.org/W2963707382","https://openalex.org/W2964101465","https://openalex.org/W2991028016","https://openalex.org/W2996095251","https://openalex.org/W3032467329","https://openalex.org/W4230230708","https://openalex.org/W4243655015","https://openalex.org/W4296580771","https://openalex.org/W4298206967"],"related_works":["https://openalex.org/W4245696228","https://openalex.org/W3106582992","https://openalex.org/W2106505873","https://openalex.org/W4234525880","https://openalex.org/W1487661898","https://openalex.org/W4293708072","https://openalex.org/W2301896740","https://openalex.org/W2149507315","https://openalex.org/W2905990309","https://openalex.org/W2047528632"],"abstract_inverted_index":{"Automatic":[0],"Exploratory":[1],"Data":[2,124],"Analysis":[3],"(EDA)":[4],"focuses":[5],"on":[6,120,215,221],"automatically":[7,93,195],"discovering":[8],"pieces":[9],"of":[10,15,47,83,102,110,182,208],"knowledge":[11,22,84,116,148,156],"in":[12,170],"the":[13,20,45,121,155,180,204],"form":[14],"interesting":[16],"data":[17,26,88,104,112,136],"patterns.":[18],"However,":[19],"conveyed":[21],"by":[23,133,158],"these":[24,51],"suggested":[25,48],"patterns":[27,49,53,137],"are":[28,54,164],"disjointed":[29],"or":[30],"lack":[31],"organization.":[32],"Therefore,":[33],"it":[34,66],"is":[35,131],"difficult":[36],"for":[37],"users":[38,59,224],"to":[39,57,60,71,90,106,114,178,194],"gain":[40],"structured":[41,81,147],"knowledge,":[42],"and":[43,94,127,143,152,160,186,190,206,218,225],"as":[44],"number":[46],"grows,":[50],"stand-alone":[52],"less":[55],"likely":[56],"motive":[58],"conduct":[61],"follow-up":[62],"analysis,":[63],"which":[64,163],"hinders":[65],"from":[67,86,199],"being":[68],"effectively":[69],"utilized":[70],"facilitate":[72,91],"EDA.":[73,171],"In":[74],"this":[75],"paper,":[76],"we":[77,97],"propose":[78,98,173],"MetaInsight,":[79,183],"a":[80,99,174,191],"representation":[82],"extracted":[85],"multi-dimensional":[87,200],"aiming":[89],"EDA":[92],"effectively.":[95],"Specifically,":[96],"novel":[100,175],"formulation":[101],"basic":[103,135],"pattern":[105],"capture":[107],"essential":[108],"characteristics":[109],"raw":[111],"distribution":[113],"achieve":[115],"extraction.":[117],"Then":[118],"based":[119],"mined":[122],"Homogeneous":[123],"Patterns":[125],"(HDP)":[126],"inter-pattern":[128],"similarity,":[129],"MetaInsight":[130],"identified":[132],"categorizing":[134],"(within":[138],"an":[139,184],"HDP)":[140],"into":[141],"commonness(es)":[142,151],"exceptions":[144,153],"thus":[145],"achieving":[146],"representation.":[149],"The":[150],"concretize":[154],"obtained":[157],"induction":[159],"validation":[161],"processes":[162],"two":[165],"typical":[166],"analysis":[167],"mechanisms":[168],"conducted":[169],"We":[172,202],"scoring":[176],"function":[177],"quantify":[179],"usefulness":[181],"effective":[185],"efficient":[187],"mining":[188],"procedure":[189],"ranking":[192],"algorithm":[193],"discover":[196],"high-quality":[197],"MetaInsights":[198,209],"data.":[201],"demonstrate":[203],"effectiveness":[205],"efficiency":[207],"(w.r.t.":[210],"facilitating":[211],"EDA)":[212],"through":[213],"evaluation":[214],"real-world":[216],"datasets":[217],"user":[219],"studies":[220],"both":[222],"expert":[223],"non-expert":[226],"users.":[227]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
