{"id":"https://openalex.org/W2064736030","doi":"https://doi.org/10.1631/jzus.c1101007","title":"VDoc+: a virtual document based approach for matching large ontologies using MapReduce","display_name":"VDoc+: a virtual document based approach for matching large ontologies using MapReduce","publication_year":2012,"publication_date":"2012-04-01","ids":{"openalex":"https://openalex.org/W2064736030","doi":"https://doi.org/10.1631/jzus.c1101007","mag":"2064736030"},"language":"en","primary_location":{"id":"doi:10.1631/jzus.c1101007","is_oa":false,"landing_page_url":"https://doi.org/10.1631/jzus.c1101007","pdf_url":null,"source":{"id":"https://openalex.org/S199067057","display_name":"Journal of Zhejiang University SCIENCE C","issn_l":"1869-1951","issn":["1869-1951","1869-196X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311937","host_organization_name":"Zhejiang University Press","host_organization_lineage":["https://openalex.org/P4310311937"],"host_organization_lineage_names":["Zhejiang University Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Zhejiang University SCIENCE C","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100438478","display_name":"Hang Zhang","orcid":"https://orcid.org/0000-0003-2514-0811"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]},{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hang Zhang","raw_affiliation_strings":["Department of Computer Science and Technology, Nanjing University, Nanjing, 210093, China","State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, 210093, China","State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","Department of Computer Science and Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Nanjing University, Nanjing, 210093, China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, 210093, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100727084","display_name":"Wei Hu","orcid":"https://orcid.org/0000-0003-3635-6335"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]},{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wei Hu","raw_affiliation_strings":["Department of Computer Science and Technology, Nanjing University, Nanjing, 210093, China","State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, 210093, China","State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","Department of Computer Science and Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Nanjing University, Nanjing, 210093, China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, 210093, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089586983","display_name":"Yuzhong Qu","orcid":"https://orcid.org/0000-0003-2777-8149"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]},{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-zhong Qu","raw_affiliation_strings":["Department of Computer Science and Technology, Nanjing University, Nanjing, 210093, China","State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, 210093, China","State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","Department of Computer Science and Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Nanjing University, Nanjing, 210093, China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, 210093, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100727084"],"corresponding_institution_ids":["https://openalex.org/I36399199","https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":2.1407,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.8851741,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"13","issue":"4","first_page":"257","last_page":"267"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9165925979614258},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6380031108856201},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5967966914176941},{"id":"https://openalex.org/keywords/testbed","display_name":"Testbed","score":0.5809964537620544},{"id":"https://openalex.org/keywords/ontology-alignment","display_name":"Ontology alignment","score":0.579338788986206},{"id":"https://openalex.org/keywords/ontology","display_name":"Ontology","score":0.559857189655304},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5052717328071594},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.48171693086624146},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.47534772753715515},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.45678409934043884},{"id":"https://openalex.org/keywords/rdf","display_name":"RDF","score":0.4556272029876709},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4410158097743988},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.42348527908325195},{"id":"https://openalex.org/keywords/tf\u2013idf","display_name":"tf\u2013idf","score":0.4183949828147888},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.2992951571941376},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.19759032130241394},{"id":"https://openalex.org/keywords/upper-ontology","display_name":"Upper ontology","score":0.13915035128593445},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.13470274209976196}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9165925979614258},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6380031108856201},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5967966914176941},{"id":"https://openalex.org/C31395832","wikidata":"https://www.wikidata.org/wiki/Q1318674","display_name":"Testbed","level":2,"score":0.5809964537620544},{"id":"https://openalex.org/C98893333","wikidata":"https://www.wikidata.org/wiki/Q4339878","display_name":"Ontology alignment","level":4,"score":0.579338788986206},{"id":"https://openalex.org/C25810664","wikidata":"https://www.wikidata.org/wiki/Q44325","display_name":"Ontology","level":2,"score":0.559857189655304},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5052717328071594},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.48171693086624146},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.47534772753715515},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.45678409934043884},{"id":"https://openalex.org/C147497476","wikidata":"https://www.wikidata.org/wiki/Q54872","display_name":"RDF","level":3,"score":0.4556272029876709},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4410158097743988},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.42348527908325195},{"id":"https://openalex.org/C81758059","wikidata":"https://www.wikidata.org/wiki/Q796584","display_name":"tf\u2013idf","level":3,"score":0.4183949828147888},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2992951571941376},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.19759032130241394},{"id":"https://openalex.org/C78726541","wikidata":"https://www.wikidata.org/wiki/Q3882785","display_name":"Upper ontology","level":3,"score":0.13915035128593445},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.13470274209976196},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1631/jzus.c1101007","is_oa":false,"landing_page_url":"https://doi.org/10.1631/jzus.c1101007","pdf_url":null,"source":{"id":"https://openalex.org/S199067057","display_name":"Journal of Zhejiang University SCIENCE C","issn_l":"1869-1951","issn":["1869-1951","1869-196X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311937","host_organization_name":"Zhejiang University Press","host_organization_lineage":["https://openalex.org/P4310311937"],"host_organization_lineage_names":["Zhejiang University Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Zhejiang University SCIENCE C","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W45122933","https://openalex.org/W59949337","https://openalex.org/W173475825","https://openalex.org/W1489772007","https://openalex.org/W1568781071","https://openalex.org/W1586850883","https://openalex.org/W1588213250","https://openalex.org/W1596947943","https://openalex.org/W1956559956","https://openalex.org/W2001877354","https://openalex.org/W2007226769","https://openalex.org/W2051582400","https://openalex.org/W2076063237","https://openalex.org/W2114538147","https://openalex.org/W2141051060","https://openalex.org/W2148014577","https://openalex.org/W2151930506","https://openalex.org/W2152928065","https://openalex.org/W2159083188","https://openalex.org/W2168080006","https://openalex.org/W2173213060","https://openalex.org/W2325227998","https://openalex.org/W2611894836","https://openalex.org/W2615115461","https://openalex.org/W2615447451","https://openalex.org/W4232845329","https://openalex.org/W6601866777","https://openalex.org/W6602455202","https://openalex.org/W6640862754"],"related_works":["https://openalex.org/W2168961710","https://openalex.org/W2169105971","https://openalex.org/W2968390902","https://openalex.org/W132650287","https://openalex.org/W116095830","https://openalex.org/W785749360","https://openalex.org/W4390992395","https://openalex.org/W2799919776","https://openalex.org/W1516708053","https://openalex.org/W2394142077"],"abstract_inverted_index":{"Many":[0],"ontologies":[1,18],"have":[2,22],"been":[3],"published":[4],"on":[5,47,68,157],"the":[6,23,48,69,83,88,103,106,129,139,148,163,176,181],"Semantic":[7],"Web,":[8],"to":[9,12,86,119,142],"be":[10],"shared":[11],"describe":[13],"resources.":[14],"Among":[15],"them,":[16],"large":[17,65],"of":[19,91],"real-world":[20],"areas":[21],"scalability":[24],"problem":[25],"in":[26,82,113,138,187],"presenting":[27],"semantic":[28],"technologies":[29],"such":[30],"as":[31],"ontology":[32],"matching":[33,64],"(OM).":[34],"This":[35,123],"either":[36],"suffers":[37],"from":[38,128,166],"too":[39],"long":[40],"run":[41,182],"time":[42,183],"or":[43],"has":[44],"strong":[45],"hypotheses":[46],"running":[49],"environment.":[50],"To":[51],"deal":[52],"with":[53,111,184],"this":[54],"issue,":[55],"we":[56],"propose":[57],"a":[58],"three-stage":[59],"MapReduce-based":[60,130],"approach":[61,178],"V-Doc+":[62],"for":[63],"ontologies,":[66],"based":[67],"MapReduce":[70,78],"framework":[71],"and":[72,96,98,162,189],"virtual":[73,121],"document":[74,151],"technique.":[75],"Specifically,":[76],"two":[77,158],"processes":[79],"are":[80,109,172],"performed":[81],"first":[84],"stage":[85,141],"extract":[87],"textual":[89],"descriptions":[90,108],"named":[92],"entities":[93],"(classes,":[94],"properties,":[95],"instances)":[97],"blank":[99],"nodes,":[100],"respectively.":[101],"In":[102],"second":[104],"stage,":[105],"extracted":[107],"exchanged":[110],"neighbors":[112],"Resource":[114],"Description":[115],"Framework":[116],"(RDF)":[117],"graphs":[118],"construct":[120],"documents.":[122],"extraction":[124],"process":[125],"also":[126],"benefits":[127],"implementation.":[131],"A":[132],"word-weight-based":[133],"partitioning":[134],"method":[135],"is":[136],"proposed":[137,177],"third":[140],"conduct":[143],"parallel":[144],"similarity":[145],"calculation":[146],"using":[147],"term":[149],"frequency-inverse":[150],"frequency":[152],"(TF-IDF)":[153],"model.":[154],"Experimental":[155],"results":[156],"large-scale":[159],"real":[160],"datasets":[161],"benchmark":[164],"testbed":[165],"Ontology":[167],"Alignment":[168],"Evaluation":[169],"Initiative":[170],"(OAEI)":[171],"reported,":[173],"showing":[174],"that":[175],"significantly":[179],"reduces":[180],"minor":[185],"loss":[186],"precision":[188],"recall.":[190]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":3},{"year":2013,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
