{"id":"https://openalex.org/W4406460256","doi":"https://doi.org/10.1109/bigdata62323.2024.10825404","title":"Tackling Data Sparsity and Combinatorial Challenges in Rare Disease Matching with Medical Informed Machine Learning","display_name":"Tackling Data Sparsity and Combinatorial Challenges in Rare Disease Matching with Medical Informed Machine Learning","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406460256","doi":"https://doi.org/10.1109/bigdata62323.2024.10825404"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825404","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825404","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046384370","display_name":"Armin Berger","orcid":"https://orcid.org/0000-0003-3109-4372"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Armin Berger","raw_affiliation_strings":["Fraunhofer IAIS,Department of Media Engineering,Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IAIS,Department of Media Engineering,Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115904952","display_name":"Tom Anglim Lagones","orcid":null},"institutions":[{"id":"https://openalex.org/I1302211766","display_name":"Queensland Health","ror":"https://ror.org/00c1dt378","country_code":"AU","type":"government","lineage":["https://openalex.org/I1302211766","https://openalex.org/I2801244131"]},{"id":"https://openalex.org/I2800882159","display_name":"Government of Western Australia Department of Health","ror":"https://ror.org/01epcny94","country_code":"AU","type":"government","lineage":["https://openalex.org/I2799506148","https://openalex.org/I2800882159"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Tom Anglim Lagones","raw_affiliation_strings":["Department of Health Queensland,Australia"],"affiliations":[{"raw_affiliation_string":"Department of Health Queensland,Australia","institution_ids":["https://openalex.org/I1302211766","https://openalex.org/I2800882159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024722052","display_name":"Lorenz Grigull","orcid":"https://orcid.org/0000-0001-8807-2874"},"institutions":[{"id":"https://openalex.org/I2799391451","display_name":"University Hospital Bonn","ror":"https://ror.org/01xnwqx93","country_code":"DE","type":"healthcare","lineage":["https://openalex.org/I2799391451"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Lorenz Grigull","raw_affiliation_strings":["University Hospital Bonn - Center for Rare Diseases,Germany"],"affiliations":[{"raw_affiliation_string":"University Hospital Bonn - Center for Rare Diseases,Germany","institution_ids":["https://openalex.org/I2799391451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115904953","display_name":"Lara Fendrich","orcid":null},"institutions":[{"id":"https://openalex.org/I2799391451","display_name":"University Hospital Bonn","ror":"https://ror.org/01xnwqx93","country_code":"DE","type":"healthcare","lineage":["https://openalex.org/I2799391451"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Lara Fendrich","raw_affiliation_strings":["University Hospital Bonn - Center for Rare Diseases,Germany"],"affiliations":[{"raw_affiliation_string":"University Hospital Bonn - Center for Rare Diseases,Germany","institution_ids":["https://openalex.org/I2799391451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110721074","display_name":"Thiago Bell","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thiago Bell","raw_affiliation_strings":["Fraunhofer IAIS,Department of Media Engineering,Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IAIS,Department of Media Engineering,Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115904954","display_name":"Henriette H\u00f6gl","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Henriette H\u00f6gl","raw_affiliation_strings":["Children&#x2019;s Network for Chronic Illnesses and Disabilities,Germany"],"affiliations":[{"raw_affiliation_string":"Children&#x2019;s Network for Chronic Illnesses and Disabilities,Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108620260","display_name":"Gundula Ernst","orcid":"https://orcid.org/0000-0002-2483-7206"},"institutions":[{"id":"https://openalex.org/I34809795","display_name":"Medizinische Hochschule Hannover","ror":"https://ror.org/00f2yqf98","country_code":"DE","type":"education","lineage":["https://openalex.org/I34809795"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gundula Ernst","raw_affiliation_strings":["Medical School Hannover,Department of Medical Psychology,Germany"],"affiliations":[{"raw_affiliation_string":"Medical School Hannover,Department of Medical Psychology,Germany","institution_ids":["https://openalex.org/I34809795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077321509","display_name":"Ralf Schmidt","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ralf Schmidt","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115904955","display_name":"David Bascom","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"David Bascom","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034781887","display_name":"Rafet Sifa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rafet Sifa","raw_affiliation_strings":["Fraunhofer IAIS,Department of Media Engineering,Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IAIS,Department of Media Engineering,Germany","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039510770","display_name":"Max L\u00fcbbering","orcid":"https://orcid.org/0000-0001-6291-9459"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Max L\u00fcbbering","raw_affiliation_strings":["Fraunhofer IAIS,Department of Media Engineering,Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer IAIS,Department of Media Engineering,Germany","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5046384370"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.4504,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.85874113,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"6430","last_page":"6438"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11642","display_name":"Genomics and Rare Diseases","score":0.9818999767303467,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6806572675704956},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6775785684585571},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5933244228363037},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.568367600440979},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3252195119857788},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.193454772233963}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6806572675704956},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6775785684585571},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5933244228363037},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.568367600440979},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3252195119857788},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.193454772233963},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825404","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825404","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},{"id":"pmh:oai:publica.fraunhofer.de:publica/499881","is_oa":false,"landing_page_url":"https://publica.fraunhofer.de/handle/publica/499881","pdf_url":null,"source":{"id":"https://openalex.org/S4306400318","display_name":"Fraunhofer-Publica (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320311687","display_name":"Ministry of Education","ror":"https://ror.org/03m01yf64"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W1144919104","https://openalex.org/W2032931058","https://openalex.org/W2295675132","https://openalex.org/W2591548807","https://openalex.org/W2921313412","https://openalex.org/W3006087551","https://openalex.org/W4251619229","https://openalex.org/W4399795410","https://openalex.org/W4401863414","https://openalex.org/W6870020180"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W3046775127","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474"],"abstract_inverted_index":{"With":[0,110],"over":[1,82],"7,000":[2],"known":[3],"rare":[4,16,43],"diseases":[5,17],"and":[6,50,56,100,113,118,130],"a":[7,14,33,71,111,124],"prevalence":[8],"of":[9,31,116,126],"less":[10],"than":[11,90],"one":[12],"in":[13,59],"thousand,":[15],"pose":[18],"substantial":[19],"challenges":[20],"to":[21],"advanced":[22],"medical":[23,51,127],"support":[24],"networks.":[25],"This":[26],"study":[27],"investigates":[28],"the":[29,136],"efficacy":[30],"Unrare.me,":[32],"novel":[34],"social":[35],"networking":[36],"platform":[37],"designed":[38],"for":[39,74],"individuals":[40],"affected":[41],"by":[42],"diseases,":[44],"including":[45,97],"patients,":[46],"their":[47],"family":[48],"members,":[49],"professionals,":[52],"addressing":[53],"data":[54,128],"sparsity":[55],"combinatorial":[57],"complexities":[58],"user":[60,76,84,101],"matching.":[61],"We":[62],"demonstrate":[63],"that":[64,123],"simple":[65],"matching":[66,85],"heuristics":[67],"already":[68],"serve":[69],"as":[70],"decent":[72],"basis":[73],"collecting":[75],"feedback":[77,86],"on":[78],"match":[79],"quality.":[80],"Leveraging":[81],"10,000":[83],"scores":[87],"from":[88],"more":[89],"2,000":[91],"active":[92],"users,":[93],"we":[94,121],"evaluate":[95],"algorithms":[96],"collaborative":[98],"filtering":[99],"embedding":[102],"similarity":[103],"with":[104],"state-of-the-art":[105],"Large":[106],"Language":[107],"Models":[108],"(LLMs).":[109],"top-10":[112],"top-5":[114],"hit-rate":[115],"55%":[117],"37%,":[119],"respectively,":[120],"show":[122],"combination":[125],"augmentation":[129],"embeddings":[131],"significantly":[132],"enhances":[133],"performance":[134],"beyond":[135],"initial":[137],"heuristic":[138],"baseline.":[139]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
