{"id":"https://openalex.org/W3201880832","doi":"https://doi.org/10.1007/s00778-021-00704-2","title":"ABSTAT-HD: a scalable tool for profiling very large knowledge graphs","display_name":"ABSTAT-HD: a scalable tool for profiling very large knowledge graphs","publication_year":2021,"publication_date":"2021-09-29","ids":{"openalex":"https://openalex.org/W3201880832","doi":"https://doi.org/10.1007/s00778-021-00704-2","mag":"3201880832"},"language":"en","primary_location":{"id":"doi:10.1007/s00778-021-00704-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00778-021-00704-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00778-021-00704-2.pdf","source":{"id":"https://openalex.org/S78926909","display_name":"The VLDB Journal","issn_l":"0949-877X","issn":["0949-877X","1066-8888"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The VLDB Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00778-021-00704-2.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081119903","display_name":"Renzo Arturo Alva Principe","orcid":null},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Renzo Arturo Alva Principe","raw_affiliation_strings":["Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067371383","display_name":"Andrea Maurino","orcid":"https://orcid.org/0000-0001-9803-3668"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Andrea Maurino","raw_affiliation_strings":["Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065845420","display_name":"Matteo Palmonari","orcid":"https://orcid.org/0000-0002-1801-5118"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Matteo Palmonari","raw_affiliation_strings":["Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079768184","display_name":"Michele Ciavotta","orcid":"https://orcid.org/0000-0002-2480-966X"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Michele Ciavotta","raw_affiliation_strings":["Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088767562","display_name":"Blerina Spahiu","orcid":"https://orcid.org/0000-0002-6958-8215"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Blerina Spahiu","raw_affiliation_strings":["Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy"],"raw_orcid":"https://orcid.org/0000-0002-6958-8215","affiliations":[{"raw_affiliation_string":"Department of Informatics, Systems and Communication, University of Milano-Bicocca, Viale Sarca, 336, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5081119903"],"corresponding_institution_ids":["https://openalex.org/I66752286"],"apc_list":{"value":2290,"currency":"EUR","value_usd":2890},"apc_paid":{"value":2290,"currency":"EUR","value_usd":2890},"fwci":1.3994,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.85153186,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"31","issue":"5","first_page":"851","last_page":"876"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.8758980631828308},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7723844647407532},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7157886624336243},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.5047577619552612},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.4486503601074219},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.42701587080955505},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.4036751985549927},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3978470265865326},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3400077819824219},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.33783793449401855},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3367946445941925},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.12318897247314453},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09447595477104187}],"concepts":[{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.8758980631828308},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7723844647407532},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7157886624336243},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.5047577619552612},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.4486503601074219},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.42701587080955505},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4036751985549927},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3978470265865326},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3400077819824219},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33783793449401855},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3367946445941925},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.12318897247314453},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09447595477104187},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1007/s00778-021-00704-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00778-021-00704-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00778-021-00704-2.pdf","source":{"id":"https://openalex.org/S78926909","display_name":"The VLDB Journal","issn_l":"0949-877X","issn":["0949-877X","1066-8888"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The VLDB Journal","raw_type":"journal-article"},{"id":"pmh:oai:boa.unimib.it:10281/327617","is_oa":true,"landing_page_url":"https://hdl.handle.net/10281/327617","pdf_url":null,"source":{"id":"https://openalex.org/S4306401259","display_name":"BOA (University of Milano-Bicocca)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66752286","host_organization_name":"University of Milano-Bicocca","host_organization_lineage":["https://openalex.org/I66752286"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:zenodo.org:152650","is_oa":true,"landing_page_url":"https://www.openaccessrepository.it/record/152650","pdf_url":null,"source":{"id":"https://openalex.org/S4306402478","display_name":"INFM-OAR (INFN Catania)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210116497","host_organization_name":"Istituto Nazionale di Fisica Nucleare, Sezione di Catania","host_organization_lineage":["https://openalex.org/I4210116497"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1007/s00778-021-00704-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00778-021-00704-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00778-021-00704-2.pdf","source":{"id":"https://openalex.org/S78926909","display_name":"The VLDB Journal","issn_l":"0949-877X","issn":["0949-877X","1066-8888"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The VLDB Journal","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6100000143051147,"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321610","display_name":"Universit\u00e0 degli Studi di Milano-Bicocca","ror":"https://ror.org/01ynf4891"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3201880832.pdf","grobid_xml":"https://content.openalex.org/works/W3201880832.grobid-xml"},"referenced_works_count":63,"referenced_works":["https://openalex.org/W170065150","https://openalex.org/W1529522905","https://openalex.org/W1805882648","https://openalex.org/W1934051226","https://openalex.org/W1988497694","https://openalex.org/W2036959307","https://openalex.org/W2038412523","https://openalex.org/W2038669342","https://openalex.org/W2043795443","https://openalex.org/W2056613579","https://openalex.org/W2081385143","https://openalex.org/W2114303224","https://openalex.org/W2125442437","https://openalex.org/W2136679991","https://openalex.org/W2162381184","https://openalex.org/W2171539317","https://openalex.org/W2222040190","https://openalex.org/W2250093878","https://openalex.org/W2268506948","https://openalex.org/W2273009367","https://openalex.org/W2282967241","https://openalex.org/W2399172669","https://openalex.org/W2400515935","https://openalex.org/W2401813704","https://openalex.org/W2418808916","https://openalex.org/W2464382551","https://openalex.org/W2471601082","https://openalex.org/W2620880249","https://openalex.org/W2755658662","https://openalex.org/W2789058128","https://openalex.org/W2790755967","https://openalex.org/W2805757480","https://openalex.org/W2807283351","https://openalex.org/W2808168743","https://openalex.org/W2809533051","https://openalex.org/W2810302553","https://openalex.org/W2886604633","https://openalex.org/W2890036314","https://openalex.org/W2891796645","https://openalex.org/W2893978701","https://openalex.org/W2902810976","https://openalex.org/W2912515744","https://openalex.org/W2942430644","https://openalex.org/W2951493102","https://openalex.org/W2953749256","https://openalex.org/W2964221236","https://openalex.org/W2966787092","https://openalex.org/W2979842165","https://openalex.org/W3003770903","https://openalex.org/W3010336026","https://openalex.org/W3015245730","https://openalex.org/W3042393666","https://openalex.org/W3046641529","https://openalex.org/W3091993229","https://openalex.org/W3100940592","https://openalex.org/W3105298605","https://openalex.org/W3106394530","https://openalex.org/W3122581267","https://openalex.org/W3146366406","https://openalex.org/W3168438209","https://openalex.org/W4200329746","https://openalex.org/W4285719527","https://openalex.org/W4288343461"],"related_works":["https://openalex.org/W2000785801","https://openalex.org/W986318368","https://openalex.org/W2384410913","https://openalex.org/W2352878646","https://openalex.org/W4390608645","https://openalex.org/W2004734601","https://openalex.org/W4390273403","https://openalex.org/W2130149817","https://openalex.org/W2990194547","https://openalex.org/W1480123525"],"abstract_inverted_index":{"Abstract":[0],"Processing":[1],"large-scale":[2],"and":[3,37,50,79,82,119,130,133,136],"highly":[4,70],"interconnected":[5],"Knowledge":[6],"Graphs":[7],"(KG)":[8],"is":[9],"becoming":[10],"crucial":[11],"for":[12],"many":[13],"applications":[14],"such":[15,54],"as":[16,55],"recommender":[17],"systems,":[18],"question":[19],"answering,":[20],"etc.":[21],"Profiling":[22],"approaches":[23],"have":[24],"been":[25],"proposed":[26],"to":[27,34,108,114],"summarize":[28],"large":[29,139],"KGs":[30],"with":[31,106],"the":[32,88,91,112],"aim":[33],"produce":[35],"concise":[36,131],"meaningful":[38],"representation":[39],"so":[40],"that":[41,74,102,124],"they":[42],"can":[43,134],"be":[44,115],"easily":[45],"managed.":[46],"However,":[47],"constructing":[48],"profiles":[49],"calculating":[51],"several":[52],"statistics":[53],"cardinality":[56],"descriptors":[57],"or":[58],"inferences":[59],"are":[60],"resource":[61],"expensive.":[62],"In":[63],"this":[64],"paper,":[65],"we":[66],"present":[67],"ABSTAT-HD,":[68],"a":[69,98],"distributed":[71],"profiling":[72,78,126],"tool":[73],"supports":[75],"users":[76],"in":[77],"understanding":[80],"big":[81],"complex":[83],"knowledge":[84],"graphs.":[85],"We":[86],"demonstrate":[87],"impact":[89],"of":[90,94,100,111],"new":[92],"architecture":[93],"ABSTAT-HD":[95],"by":[96],"presenting":[97],"set":[99],"experiments":[101],"show":[103],"its":[104],"scalability":[105],"respect":[107],"three":[109],"dimensions":[110],"data":[113],"processed:":[116],"size,":[117],"complexity":[118],"workload.":[120],"The":[121],"experimentation":[122],"shows":[123],"our":[125],"framework":[127],"provides":[128],"informative":[129],"profiles,":[132],"process":[135],"manage":[137],"very":[138],"KGs.":[140]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-29T09:21:14.243279","created_date":"2021-10-11T00:00:00"}
