{"id":"https://openalex.org/W4280530336","doi":"https://doi.org/10.1007/978-3-031-05936-0_37","title":"An Adaptable Indexing Pipeline for\u00a0Enriching Meta Information of\u00a0Datasets from\u00a0Heterogeneous Repositories","display_name":"An Adaptable Indexing Pipeline for\u00a0Enriching Meta Information of\u00a0Datasets from\u00a0Heterogeneous Repositories","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4280530336","doi":"https://doi.org/10.1007/978-3-031-05936-0_37"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-031-05936-0_37","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-031-05936-0_37","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://pure.uva.nl/ws/files/117788060/2022.conference.akdd.caera.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041493190","display_name":"Siamak Farshidi","orcid":"https://orcid.org/0000-0001-6139-921X"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Siamak Farshidi","raw_affiliation_strings":["Multiscale Networked Systems, University of Amsterdam, Amsterdam, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Multiscale Networked Systems, University of Amsterdam, Amsterdam, The Netherlands","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068341719","display_name":"Zhiming Zhao","orcid":"https://orcid.org/0000-0002-6717-9418"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Zhiming Zhao","raw_affiliation_strings":["Multiscale Networked Systems, University of Amsterdam, Amsterdam, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Multiscale Networked Systems, University of Amsterdam, Amsterdam, The Netherlands","institution_ids":["https://openalex.org/I887064364"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5068341719"],"corresponding_institution_ids":["https://openalex.org/I887064364"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":6.3086,"has_fulltext":true,"cited_by_count":10,"citation_normalized_percentile":{"value":0.96867331,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"472","last_page":"484"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9833999872207642,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8637988567352295},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.7592732906341553},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6716106534004211},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6325567960739136},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5901973843574524},{"id":"https://openalex.org/keywords/interoperability","display_name":"Interoperability","score":0.5161474943161011},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.504639744758606},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.49197790026664734},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.4903745651245117},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.4561646580696106},{"id":"https://openalex.org/keywords/publication","display_name":"Publication","score":0.4337003827095032},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.36899614334106445}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8637988567352295},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.7592732906341553},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6716106534004211},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6325567960739136},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5901973843574524},{"id":"https://openalex.org/C20136886","wikidata":"https://www.wikidata.org/wiki/Q749647","display_name":"Interoperability","level":2,"score":0.5161474943161011},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.504639744758606},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.49197790026664734},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4903745651245117},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4561646580696106},{"id":"https://openalex.org/C41458344","wikidata":"https://www.wikidata.org/wiki/Q732577","display_name":"Publication","level":2,"score":0.4337003827095032},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36899614334106445},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C112698675","wikidata":"https://www.wikidata.org/wiki/Q37038","display_name":"Advertising","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1007/978-3-031-05936-0_37","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-031-05936-0_37","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:dare.uva.nl:publications/4073a479-1d25-4c9b-9da1-5e78181a1704","is_oa":true,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/an-adaptable-indexing-pipeline-forenriching-meta-information-ofdatasets-fromheterogeneous-repositories(4073a479-1d25-4c9b-9da1-5e78181a1704).html","pdf_url":"https://pure.uva.nl/ws/files/117788060/2022.conference.akdd.caera.pdf","source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Farshidi, S & Zhao, Z 2022, An Adaptable Indexing Pipeline for\u00a0Enriching Meta Information of\u00a0Datasets from\u00a0Heterogeneous Repositories. in J Gama, T Li, Y Yu, E Chen, Y Zheng & F Teng (eds), Advances in Knowledge Discovery and Data Mining : 26th Pacific-Asia Conference, PAKDD 2022, Chengdu, China, May 16\u201319, 2022 : proceedings. vol. II, Lecture Notes in Computer Science, vol. 13281, Lecture Notes in Artificial Intelligence, Cham, pp. 472-484, 26th Pacific-Asia Conference on Knowledge Discovery and Data Mining, PAKDD 2022, Chengdu, China, 16/05/22. https://doi.org/10.1007/978-3-031-05936-0_37","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:zenodo.org:6555644","is_oa":true,"landing_page_url":"https://zenodo.org/record/6555644","pdf_url":"https://zenodo.org/record/6555644","source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferencePaper"},{"id":"pmh:oai:dare.uva.nl:openaire_cris_publications/4073a479-1d25-4c9b-9da1-5e78181a1704","is_oa":true,"landing_page_url":"https://hdl.handle.net/11245.1/4073a479-1d25-4c9b-9da1-5e78181a1704","pdf_url":null,"source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Farshidi, S & Zhao, Z 2022, An Adaptable Indexing Pipeline for\u00a0Enriching Meta Information of\u00a0Datasets from\u00a0Heterogeneous Repositories. in J Gama, T Li, Y Yu, E Chen, Y Zheng & F Teng (eds), Advances in Knowledge Discovery and Data Mining : 26th Pacific-Asia Conference, PAKDD 2022, Chengdu, China, May 16\u201319, 2022 : proceedings. vol. II, Lecture Notes in Computer Science, vol. 13281, Lecture Notes in Artificial Intelligence, Cham, pp. 472-484, 26th Pacific-Asia Conference on Knowledge Discovery and Data Mining, PAKDD 2022, Chengdu, China, 16/05/22. https://doi.org/10.1007/978-3-031-05936-0_37","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:uvapub:oai:dare.uva.nl:openaire_cris_publications/4073a479-1d25-4c9b-9da1-5e78181a1704","is_oa":true,"landing_page_url":"https://dare.uva.nl/personal/pure/en/publications/an-adaptable-indexing-pipeline-forenriching-meta-information-ofdatasets-fromheterogeneous-repositories(4073a479-1d25-4c9b-9da1-5e78181a1704).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Advances in Knowledge Discovery and Data Mining: 26th Pacific-Asia Conference, PAKDD 2022, Chengdu, China, May 16\u201319, 2022 : proceedings, II, 472 - 484","raw_type":"info:eu-repo/semantics/conferencepaper"}],"best_oa_location":{"id":"pmh:oai:dare.uva.nl:publications/4073a479-1d25-4c9b-9da1-5e78181a1704","is_oa":true,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/an-adaptable-indexing-pipeline-forenriching-meta-information-ofdatasets-fromheterogeneous-repositories(4073a479-1d25-4c9b-9da1-5e78181a1704).html","pdf_url":"https://pure.uva.nl/ws/files/117788060/2022.conference.akdd.caera.pdf","source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Farshidi, S & Zhao, Z 2022, An Adaptable Indexing Pipeline for\u00a0Enriching Meta Information of\u00a0Datasets from\u00a0Heterogeneous Repositories. in J Gama, T Li, Y Yu, E Chen, Y Zheng & F Teng (eds), Advances in Knowledge Discovery and Data Mining : 26th Pacific-Asia Conference, PAKDD 2022, Chengdu, China, May 16\u201319, 2022 : proceedings. vol. II, Lecture Notes in Computer Science, vol. 13281, Lecture Notes in Artificial Intelligence, Cham, pp. 472-484, 26th Pacific-Asia Conference on Knowledge Discovery and Data Mining, PAKDD 2022, Chengdu, China, 16/05/22. https://doi.org/10.1007/978-3-031-05936-0_37","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"score":0.5400000214576721,"display_name":"Life below water","id":"https://metadata.un.org/sdg/14"}],"awards":[{"id":"https://openalex.org/G3912856170","display_name":null,"funder_award_id":"824068","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G4956428346","display_name":null,"funder_award_id":"Horizon 2020 research and innovatio","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G7761236267","display_name":null,"funder_award_id":"862409","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8318064016","display_name":null,"funder_award_id":"Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8764417039","display_name":"smART socIal media eCOsytstem in a blockchaiN Federated environment","funder_award_id":"825134","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4280530336.pdf","grobid_xml":"https://content.openalex.org/works/W4280530336.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W173587568","https://openalex.org/W1576228976","https://openalex.org/W1968927634","https://openalex.org/W1978210737","https://openalex.org/W2073303515","https://openalex.org/W2148117599","https://openalex.org/W2148738951","https://openalex.org/W2168332560","https://openalex.org/W2598446296","https://openalex.org/W2750856415","https://openalex.org/W2752618741","https://openalex.org/W2787908404","https://openalex.org/W2804310261","https://openalex.org/W2901376054","https://openalex.org/W2926805670","https://openalex.org/W2950031835","https://openalex.org/W2969723769","https://openalex.org/W3002636616","https://openalex.org/W3086726503","https://openalex.org/W3124325695","https://openalex.org/W3125261728","https://openalex.org/W3173088060","https://openalex.org/W4233925072","https://openalex.org/W6631393269","https://openalex.org/W6906493647"],"related_works":["https://openalex.org/W2392768766","https://openalex.org/W2058118494","https://openalex.org/W2095118173","https://openalex.org/W2382021449","https://openalex.org/W2104269053","https://openalex.org/W2106424170","https://openalex.org/W2093262417","https://openalex.org/W2501188010","https://openalex.org/W4299935056","https://openalex.org/W2768810474"],"abstract_inverted_index":null,"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
