{"id":"https://openalex.org/W4320024148","doi":"https://doi.org/10.1109/bigdata55660.2022.10020716","title":"Wikidata-lite for Knowledge Extraction and Exploration","display_name":"Wikidata-lite for Knowledge Extraction and Exploration","publication_year":2022,"publication_date":"2022-12-17","ids":{"openalex":"https://openalex.org/W4320024148","doi":"https://doi.org/10.1109/bigdata55660.2022.10020716"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata55660.2022.10020716","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata55660.2022.10020716","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101682562","display_name":"Phuc Nguyen","orcid":"https://orcid.org/0000-0003-1679-723X"},"institutions":[{"id":"https://openalex.org/I184597095","display_name":"National Institute of Informatics","ror":"https://ror.org/04ksd4g47","country_code":"JP","type":"facility","lineage":["https://openalex.org/I1319490839","https://openalex.org/I184597095","https://openalex.org/I4210158934"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Phuc Nguyen","raw_affiliation_strings":["National Institute of Informatics,Japan","National Institute of Informatics, Japan"],"affiliations":[{"raw_affiliation_string":"National Institute of Informatics,Japan","institution_ids":["https://openalex.org/I184597095"]},{"raw_affiliation_string":"National Institute of Informatics, Japan","institution_ids":["https://openalex.org/I184597095"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043917711","display_name":"Hideaki Takeda","orcid":"https://orcid.org/0000-0002-2909-7163"},"institutions":[{"id":"https://openalex.org/I184597095","display_name":"National Institute of Informatics","ror":"https://ror.org/04ksd4g47","country_code":"JP","type":"facility","lineage":["https://openalex.org/I1319490839","https://openalex.org/I184597095","https://openalex.org/I4210158934"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hideaki Takeda","raw_affiliation_strings":["National Institute of Informatics,Japan","National Institute of Informatics, Japan"],"affiliations":[{"raw_affiliation_string":"National Institute of Informatics,Japan","institution_ids":["https://openalex.org/I184597095"]},{"raw_affiliation_string":"National Institute of Informatics, Japan","institution_ids":["https://openalex.org/I184597095"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5101682562"],"corresponding_institution_ids":["https://openalex.org/I184597095"],"apc_list":null,"apc_paid":null,"fwci":0.2078,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.46245421,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"3684","last_page":"3686"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8655605316162109},{"id":"https://openalex.org/keywords/sparql","display_name":"SPARQL","score":0.6546679735183716},{"id":"https://openalex.org/keywords/knowledge-graph","display_name":"Knowledge graph","score":0.6206166744232178},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5738113522529602},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.48895537853240967},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4782111346721649},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.39852097630500793},{"id":"https://openalex.org/keywords/rdf","display_name":"RDF","score":0.21581557393074036},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.18522590398788452}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8655605316162109},{"id":"https://openalex.org/C41009113","wikidata":"https://www.wikidata.org/wiki/Q54871","display_name":"SPARQL","level":4,"score":0.6546679735183716},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.6206166744232178},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5738113522529602},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.48895537853240967},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4782111346721649},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.39852097630500793},{"id":"https://openalex.org/C147497476","wikidata":"https://www.wikidata.org/wiki/Q54872","display_name":"RDF","level":3,"score":0.21581557393074036},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.18522590398788452},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata55660.2022.10020716","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata55660.2022.10020716","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W2080133951","https://openalex.org/W3109507892","https://openalex.org/W6802165776","https://openalex.org/W6803052437","https://openalex.org/W6987030581"],"related_works":["https://openalex.org/W2038821533","https://openalex.org/W2295889387","https://openalex.org/W76044956","https://openalex.org/W129667569","https://openalex.org/W3142934089","https://openalex.org/W2528665947","https://openalex.org/W2764264137","https://openalex.org/W4297737180","https://openalex.org/W2226235235","https://openalex.org/W2899333420"],"abstract_inverted_index":{"Wikidata":[0,105],"is":[1,34,114],"the":[2,28,103],"largest":[3],"collaborative":[4],"general":[5],"knowledge":[6,19,76],"graph":[7],"supported":[8],"by":[9,89],"a":[10,38,68,72],"worldwide":[11],"community.":[12],"It":[13],"includes":[14],"many":[15,57],"helpful":[16],"topics":[17],"for":[18,75,108],"exploration":[20],"and":[21,78,97],"data":[22,42],"science":[23],"applications.":[24],"However,":[25],"due":[26],"to":[27,36,70],"enormous":[29],"size":[30],"of":[31,41,45],"Wikidata,":[32],"it":[33],"challenging":[35],"retrieve":[37],"large":[39,51],"amount":[40],"with":[43],"millions":[44],"results,":[46],"make":[47],"complex":[48],"queries":[49],"requiring":[50],"aggregation":[52],"operations,":[53],"or":[54,86],"access":[55],"too":[56],"statement":[58],"references.":[59],"This":[60],"paper":[61],"introduces":[62],"our":[63],"preliminary":[64],"works":[65],"on":[66],"Wikidata-lite,":[67],"toolkit":[69],"build":[71],"database":[73],"offline":[74],"extraction":[77],"exploration,":[79],"e.g.,":[80],"retrieving":[81],"item":[82],"information,":[83],"statements,":[84],"provenances,":[85],"searching":[87],"entities":[88],"their":[90],"keywords,":[91],"attributes.":[92],"Wikidata-lite":[93,112],"has":[94],"high":[95],"performance":[96],"memory":[98],"efficiency,":[99],"much":[100],"faster":[101],"than":[102],"official":[104],"SPARQL":[106],"endpoint":[107],"big":[109],"queries.":[110],"The":[111],"repository":[113],"available":[115],"at":[116],"https://github.com/phucty/wikidb.":[117]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
