{"id":"https://openalex.org/W7138922462","doi":"https://doi.org/10.48550/arxiv.2603.15711","title":"Knowledge Graph Extraction from Biomedical Literature for Alkaptonuria Rare Disease","display_name":"Knowledge Graph Extraction from Biomedical Literature for Alkaptonuria Rare Disease","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7138922462","doi":"https://doi.org/10.48550/arxiv.2603.15711"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15711","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15711","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15711","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111120344","display_name":"Giang L. T. Pham","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Pham, Giang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094358617","display_name":"Rebecca Finetti","orcid":"https://orcid.org/0009-0000-6969-1493"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Finetti, Rebecca","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130128763","display_name":"Caterina Graziani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Graziani, Caterina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059180587","display_name":"Bianca Roncaglia","orcid":"https://orcid.org/0009-0002-0009-4011"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Roncaglia, Bianca","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130034303","display_name":"Asma Bendjeddou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bendjeddou, Asma","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129836215","display_name":"Linda Brodo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brodo, Linda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051761627","display_name":"Sara Brunetti","orcid":"https://orcid.org/0000-0001-9365-8335"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brunetti, Sara","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053216941","display_name":"Moreno Falaschi","orcid":"https://orcid.org/0000-0002-6659-3828"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Falaschi, Moreno","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130114856","display_name":"Stefano Forti","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Forti, Stefano","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128576617","display_name":"Silvia Giulia Galfr\u00e9","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Galfr\u00e9, Silvia Giulia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129946981","display_name":"Paolo Milazzo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Milazzo, Paolo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028775661","display_name":"Corrado Priami","orcid":"https://orcid.org/0000-0002-3261-6235"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Priami, Corrado","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021170470","display_name":"Annalisa Santucci","orcid":"https://orcid.org/0000-0001-6976-9086"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Santucci, Annalisa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091710523","display_name":"Ottavia Spiga","orcid":"https://orcid.org/0000-0002-0263-7107"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Spiga, Ottavia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130068379","display_name":"Alina S\u00eerbu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"S\u00eerbu, Alina","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":15,"corresponding_author_ids":["https://openalex.org/A5111120344"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11027","display_name":"Metabolism and Genetic Disorders","score":0.6945000290870667,"subfield":{"id":"https://openalex.org/subfields/1308","display_name":"Clinical Biochemistry"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11027","display_name":"Metabolism and Genetic Disorders","score":0.6945000290870667,"subfield":{"id":"https://openalex.org/subfields/1308","display_name":"Clinical Biochemistry"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11642","display_name":"Genomics and Rare Diseases","score":0.09449999779462814,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12915","display_name":"Biochemical Acid Research Studies","score":0.018400000408291817,"subfield":{"id":"https://openalex.org/subfields/1303","display_name":"Biochemistry"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/alkaptonuria","display_name":"Alkaptonuria","score":0.9297000169754028},{"id":"https://openalex.org/keywords/homogentisic-acid","display_name":"Homogentisic acid","score":0.8585000038146973},{"id":"https://openalex.org/keywords/disease","display_name":"Disease","score":0.6417999863624573},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4887000024318695},{"id":"https://openalex.org/keywords/metabolic-disease","display_name":"Metabolic disease","score":0.48170000314712524},{"id":"https://openalex.org/keywords/ochronosis","display_name":"Ochronosis","score":0.4318999946117401},{"id":"https://openalex.org/keywords/pathological","display_name":"Pathological","score":0.42149999737739563},{"id":"https://openalex.org/keywords/knowledge-graph","display_name":"Knowledge graph","score":0.33480000495910645}],"concepts":[{"id":"https://openalex.org/C2776743390","wikidata":"https://www.wikidata.org/wiki/Q651680","display_name":"Alkaptonuria","level":2,"score":0.9297000169754028},{"id":"https://openalex.org/C2776255415","wikidata":"https://www.wikidata.org/wiki/Q416054","display_name":"Homogentisic acid","level":2,"score":0.8585000038146973},{"id":"https://openalex.org/C2779134260","wikidata":"https://www.wikidata.org/wiki/Q12136","display_name":"Disease","level":2,"score":0.6417999863624573},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4887000024318695},{"id":"https://openalex.org/C2991848491","wikidata":"https://www.wikidata.org/wiki/Q2351083","display_name":"Metabolic disease","level":2,"score":0.48170000314712524},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.46619999408721924},{"id":"https://openalex.org/C2777169657","wikidata":"https://www.wikidata.org/wiki/Q1507609","display_name":"Ochronosis","level":2,"score":0.4318999946117401},{"id":"https://openalex.org/C207886595","wikidata":"https://www.wikidata.org/wiki/Q1456138","display_name":"Pathological","level":2,"score":0.42149999737739563},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.3930000066757202},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.3677000105381012},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.36329999566078186},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.33480000495910645},{"id":"https://openalex.org/C47042493","wikidata":"https://www.wikidata.org/wiki/Q265799","display_name":"Human genetics","level":3,"score":0.32269999384880066},{"id":"https://openalex.org/C2779701055","wikidata":"https://www.wikidata.org/wiki/Q929833","display_name":"Rare disease","level":3,"score":0.3109999895095825},{"id":"https://openalex.org/C2777735490","wikidata":"https://www.wikidata.org/wiki/Q2351083","display_name":"Metabolic disorder","level":2,"score":0.29499998688697815},{"id":"https://openalex.org/C3018605307","wikidata":"https://www.wikidata.org/wiki/Q200779","display_name":"Complex disease","level":3,"score":0.2838999927043915},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.28380000591278076},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.271699994802475},{"id":"https://openalex.org/C2779473830","wikidata":"https://www.wikidata.org/wiki/Q1540899","display_name":"MEDLINE","level":2,"score":0.26100000739097595},{"id":"https://openalex.org/C2777466982","wikidata":"https://www.wikidata.org/wiki/Q5227287","display_name":"Data extraction","level":3,"score":0.25270000100135803},{"id":"https://openalex.org/C22593422","wikidata":"https://www.wikidata.org/wiki/Q3242583","display_name":"Pedigree chart","level":3,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15711","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15711","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15711","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15711","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.567659854888916,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Alkaptonuria":[0],"(AKU)":[1],"is":[2,57,90],"an":[3],"ultra-rare":[4],"autosomal":[5],"recessive":[6],"metabolic":[7,168],"disorder":[8],"caused":[9],"by":[10],"mutations":[11],"in":[12,27,60,96,165],"the":[13,49,55,73,77,147,151,160],"HGD":[14],"(Homogentisate":[15],"1,2-Dioxygenase)":[16],"gene,":[17],"leading":[18],"to":[19,34,54,133,141],"a":[20,105],"pathological":[21],"accumulation":[22],"of":[23,51,62,114,121,150,162],"homogentisic":[24],"acid":[25],"(HGA)":[26],"body":[28],"fluids":[29],"and":[30,41,44,65,82,130,137,155],"tissues.":[31],"This":[32,143],"leads":[33],"systemic":[35,148],"manifestations,":[36],"including":[37],"premature":[38],"spondyloarthropathy,":[39],"renal":[40],"prostatic":[42],"stones,":[43],"cardiovascular":[45],"complications.":[46],"Being":[47],"ultra-rare,":[48],"amount":[50],"data":[52,64],"related":[53,140],"disease":[56,78],"limited,":[58],"both":[59],"terms":[61],"clinical":[63],"literature.":[66],"Knowledge":[67],"graphs":[68],"(KGs)":[69],"can":[70],"help":[71],"connect":[72],"limited":[74],"knowledge":[75,129],"about":[76],"(basic":[79],"mechanisms,":[80],"manifestations":[81],"existing":[83,97,127],"therapies)":[84],"with":[85],"other":[86],"knowledge;":[87],"however,":[88],"AKU":[89],"frequently":[91],"underrepresented":[92],"or":[93],"entirely":[94],"absent":[95],"biomedical":[98,115],"KGs.":[99],"In":[100],"this":[101],"work,":[102],"we":[103],"apply":[104],"text-mining":[106],"methodology":[107],"based":[108],"on":[109],"PubTator3":[110],"for":[111],"large-scale":[112],"extraction":[113],"relations.":[116],"We":[117],"construct":[118],"two":[119],"KGs":[120],"different":[122],"sizes,":[123],"validate":[124],"them":[125,132],"using":[126],"biochemical":[128],"use":[131],"extract":[134],"genes,":[135],"diseases":[136],"therapies":[138],"possibly":[139],"AKU.":[142],"computational":[144],"framework":[145],"reveals":[146],"interactions":[149],"disease,":[152],"its":[153],"comorbidities,":[154],"potential":[156],"therapeutic":[157],"targets,":[158],"demonstrating":[159],"efficacy":[161],"our":[163],"approach":[164],"analyzing":[166],"rare":[167],"disorders.":[169]},"counts_by_year":[],"updated_date":"2026-03-20T20:54:20.808490","created_date":"2026-03-20T00:00:00"}
