{"id":"https://openalex.org/W2783963764","doi":"https://doi.org/10.1109/bigdata.2017.8258174","title":"Building new knowledge from distributed scientific corpus: HERBADROP &amp; EUROPEANA: Two concrete case studies for exploring big archival data","display_name":"Building new knowledge from distributed scientific corpus: HERBADROP &amp; EUROPEANA: Two concrete case studies for exploring big archival data","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2783963764","doi":"https://doi.org/10.1109/bigdata.2017.8258174","mag":"2783963764"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2017.8258174","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2017.8258174","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084822210","display_name":"Pascal Dug\u00e9nie","orcid":null},"institutions":[{"id":"https://openalex.org/I4210091683","display_name":"Centre Informatique National de l'Enseignement Sup\u00e9rieur","ror":"https://ror.org/00gnrwz95","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210091683"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Pascal Dugenie","raw_affiliation_strings":["CINES, Centre Informatique National de l'Enseignement Superieur, Montpellier, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CINES, Centre Informatique National de l'Enseignement Superieur, Montpellier, France","institution_ids":["https://openalex.org/I4210091683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085617401","display_name":"Nuno Freire","orcid":"https://orcid.org/0000-0002-3632-8046"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nuno Freire","raw_affiliation_strings":["INESC-ID/Europeana DSI, Den Haag, NL"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INESC-ID/Europeana DSI, Den Haag, NL","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076410186","display_name":"Daan Broeder","orcid":"https://orcid.org/0000-0002-8446-3410"},"institutions":[{"id":"https://openalex.org/I4210158762","display_name":"Meertens Institute","ror":"https://ror.org/05kaxyq51","country_code":"NL","type":"facility","lineage":["https://openalex.org/I1322597698","https://openalex.org/I4210158762"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Daan Broeder","raw_affiliation_strings":["MEERTENS Institut (Afdeling Technische Ontwikkeling), Amsterdam, NL"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"MEERTENS Institut (Afdeling Technische Ontwikkeling), Amsterdam, NL","institution_ids":["https://openalex.org/I4210158762"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.5064,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.77634215,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"24","issue":null,"first_page":"2231","last_page":"2239"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9836000204086304,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cultural-heritage","display_name":"Cultural heritage","score":0.6959831714630127},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6853194236755371},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.6823645830154419},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.6417607069015503},{"id":"https://openalex.org/keywords/linked-data","display_name":"Linked data","score":0.4837627410888672},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.4772886335849762},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4695834517478943},{"id":"https://openalex.org/keywords/knowledge-extraction","display_name":"Knowledge extraction","score":0.44398176670074463},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.3583309054374695},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.2320345640182495},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.16189250349998474},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.1194237470626831},{"id":"https://openalex.org/keywords/archaeology","display_name":"Archaeology","score":0.110798180103302}],"concepts":[{"id":"https://openalex.org/C60671577","wikidata":"https://www.wikidata.org/wiki/Q210272","display_name":"Cultural heritage","level":2,"score":0.6959831714630127},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6853194236755371},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.6823645830154419},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.6417607069015503},{"id":"https://openalex.org/C69075417","wikidata":"https://www.wikidata.org/wiki/Q515701","display_name":"Linked data","level":3,"score":0.4837627410888672},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4772886335849762},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4695834517478943},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.44398176670074463},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.3583309054374695},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.2320345640182495},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.16189250349998474},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.1194237470626831},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.110798180103302},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2017.8258174","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2017.8258174","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.550000011920929,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1547210326","https://openalex.org/W2001848404","https://openalex.org/W2042932925","https://openalex.org/W2063516906","https://openalex.org/W2100178820","https://openalex.org/W2140623652","https://openalex.org/W2159024099","https://openalex.org/W2554301102","https://openalex.org/W2584335649","https://openalex.org/W2585043100","https://openalex.org/W2585496165","https://openalex.org/W2885792208","https://openalex.org/W3049031626","https://openalex.org/W6748082880"],"related_works":["https://openalex.org/W4390608645","https://openalex.org/W4247566972","https://openalex.org/W4394895745","https://openalex.org/W2960264696","https://openalex.org/W3090563135","https://openalex.org/W2497432351","https://openalex.org/W4206777497","https://openalex.org/W2910064364","https://openalex.org/W4200136508","https://openalex.org/W2499527417"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"approaches":[3],"for":[4,55,94,139],"building":[5],"new":[6,155],"knowledge":[7,174,190],"using":[8],"emerging":[9],"methods":[10],"and":[11,34,105,127,175,181,189],"big":[12,186],"data":[13,89,125,142,180,187],"technologies":[14],"together":[15,128],"with":[16,32,72,129],"archival":[17,163],"practices.":[18],"Two":[19],"cases":[20],"studies":[21,65],"have":[22],"been":[23],"considered.":[24],"The":[25,39,58],"first":[26],"one":[27,41],"called":[28,42],"HERBADROP":[29,85],"is":[30,66,116],"concerned":[31,71],"preservation":[33],"analysis":[35],"of":[36,50,75,108,119,121,161,170],"herbarium":[37],"images.":[38],"second":[40],"EUROPEANA":[43,98],"investigates":[44],"how":[45,149],"to":[46,102,134],"facilitate":[47],"the":[48,73,80,88,122,159,168],"re-use":[49],"cultural":[51,109],"heritage":[52,77,110],"language":[53],"resources":[54,78],"research":[56,131,141,156],"purposes.":[57],"common":[59,137],"point":[60],"between":[61],"these":[62],"two":[63],"case":[64],"that":[67],"they":[68],"are":[69],"both":[70],"use":[74],"valuable":[76],"within":[79],"EUDAT":[81,93,101,112],"(European":[82],"Data)":[83],"infrastructure.":[84],"leverages":[86,99],"on":[87,100],"services":[90],"provided":[91],"by":[92],"long-term":[95],"preservation,":[96],"while":[97],"achieve":[103],"citability":[104],"persistent":[106],"identification":[107],"datasets.":[111],"<sup":[113],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[114],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</sup>":[115],"an":[117],"initiative":[118],"some":[120,154],"main":[123],"European":[124],"centers":[126],"community":[130],"infrastructure":[132],"organisations,":[133],"build":[135],"a":[136],"eInfrastructure":[138],"general":[140],"management.":[143],"In":[144],"this":[145],"paper,":[146],"we":[147],"show":[148],"technologcal":[150],"trends":[151],"may":[152],"offer":[153],"potential":[157],"in":[158,165],"domain":[160],"computational":[162],"science":[164],"particular":[166],"appraising":[167],"challenges":[169],"producing":[171],"quality,":[172],"meaning,":[173],"value":[176],"from":[177],"quantity,":[178],"tracing":[179],"analytic":[182],"provenance":[183],"across":[184],"complex":[185],"platforms":[188],"production":[191],"ecosystems.":[192]},"counts_by_year":[{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
