{"id":"https://openalex.org/W4400572812","doi":"https://doi.org/10.48550/arxiv.2407.06211","title":"Synthetic data: How could it be used for infectious disease research?","display_name":"Synthetic data: How could it be used for infectious disease research?","publication_year":2024,"publication_date":"2024-07-03","ids":{"openalex":"https://openalex.org/W4400572812","doi":"https://doi.org/10.48550/arxiv.2407.06211"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2407.06211","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.06211","pdf_url":"https://arxiv.org/pdf/2407.06211","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2407.06211","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087364126","display_name":"Styliani-Christina Fragkouli","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Fragkouli, Styliani-Christina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086917765","display_name":"Dhwani Solanki","orcid":"https://orcid.org/0009-0004-1529-0095"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Solanki, Dhwani","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111254970","display_name":"Leyla J Castro","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Castro, Leyla J","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078171708","display_name":"Fotis Psomopoulos","orcid":"https://orcid.org/0000-0002-0222-4273"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Psomopoulos, Fotis E","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080481806","display_name":"N\u00faria Queralt-Rosi\u00f1ach","orcid":"https://orcid.org/0000-0003-0169-8159"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Queralt-Rosinach, N\u00faria","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044037386","display_name":"Davide Cirillo","orcid":"https://orcid.org/0000-0003-4982-4716"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cirillo, Davide","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5059822885","display_name":"Lisa Crossman","orcid":"https://orcid.org/0000-0003-2390-4750"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Crossman, Lisa C","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5087364126"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11819","display_name":"Data-Driven Disease Surveillance","score":0.8016999959945679,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11819","display_name":"Data-Driven Disease Surveillance","score":0.8016999959945679,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/infectious-disease","display_name":"Infectious disease (medical specialty)","score":0.6184107661247253},{"id":"https://openalex.org/keywords/disease","display_name":"Disease","score":0.5186578631401062},{"id":"https://openalex.org/keywords/research-data","display_name":"Research data","score":0.44181787967681885},{"id":"https://openalex.org/keywords/virology","display_name":"Virology","score":0.4043439030647278},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.3811219334602356},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.34483203291893005},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.32518836855888367},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.2978445887565613},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.27840930223464966},{"id":"https://openalex.org/keywords/pathology","display_name":"Pathology","score":0.10546353459358215}],"concepts":[{"id":"https://openalex.org/C524204448","wikidata":"https://www.wikidata.org/wiki/Q788926","display_name":"Infectious disease (medical specialty)","level":3,"score":0.6184107661247253},{"id":"https://openalex.org/C2779134260","wikidata":"https://www.wikidata.org/wiki/Q12136","display_name":"Disease","level":2,"score":0.5186578631401062},{"id":"https://openalex.org/C3020038283","wikidata":"https://www.wikidata.org/wiki/Q42848","display_name":"Research data","level":3,"score":0.44181787967681885},{"id":"https://openalex.org/C159047783","wikidata":"https://www.wikidata.org/wiki/Q7215","display_name":"Virology","level":1,"score":0.4043439030647278},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.3811219334602356},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.34483203291893005},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.32518836855888367},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2978445887565613},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.27840930223464966},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.10546353459358215},{"id":"https://openalex.org/C91632574","wikidata":"https://www.wikidata.org/wiki/Q15088675","display_name":"Data curation","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2407.06211","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.06211","pdf_url":"https://arxiv.org/pdf/2407.06211","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"pmh:doi:10.48550/arxiv.2407.06211","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2407.06211","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2407.06211","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2407.06211","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.06211","pdf_url":"https://arxiv.org/pdf/2407.06211","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4400572812.pdf","grobid_xml":"https://content.openalex.org/works/W4400572812.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2007075040","https://openalex.org/W1489156230","https://openalex.org/W2126232866","https://openalex.org/W1966515077","https://openalex.org/W2060843273","https://openalex.org/W4205149165","https://openalex.org/W2018501181","https://openalex.org/W2015220664","https://openalex.org/W2017421301","https://openalex.org/W2124479668"],"abstract_inverted_index":{"Over":[0],"the":[1,31,39,52,135,181,194,219],"last":[2],"three":[3],"to":[4,11,59,140,152,196,204,214],"five":[5],"years,":[6],"it":[7],"has":[8],"become":[9],"possible":[10],"generate":[12],"machine":[13,103],"learning":[14,104],"synthetic":[15,84,199,225],"data":[16,87,93,121,200,226],"for":[17],"healthcare-related":[18],"uses.":[19],"However,":[20],"concerns":[21],"have":[22],"been":[23],"raised":[24],"about":[25],"potential":[26,40],"negative":[27],"factors":[28],"associated":[29],"with":[30,83],"possibilities":[32,82],"of":[33,42,54,65,114,128,142,183,218,224],"artificial":[34,44,110],"dataset":[35],"generation.":[36],"These":[37,147],"include":[38],"misuse":[41],"generative":[43,123],"intelligence":[45,111],"(AI)":[46],"in":[47,92,96,102,130,227],"fields":[48],"such":[49],"as":[50],"cybercrime,":[51],"use":[53,141],"deepfakes":[55],"and":[56,63,77,81,99,137,157,163,187,221],"fake":[57],"news":[58],"deceive":[60],"or":[61,119],"manipulate,":[62],"displacement":[64],"human":[66],"jobs":[67],"across":[68],"various":[69],"market":[70],"sectors.":[71],"Here,":[72],"we":[73,212],"consider":[74,197],"both":[75],"current":[76,220],"future":[78,222],"positive":[79],"advances":[80],"datasets.":[85],"Synthetic":[86],"offers":[88],"significant":[89],"benefits,":[90],"particularly":[91],"privacy,":[94],"research,":[95],"balancing":[97],"datasets":[98],"reducing":[100],"bias":[101],"models.":[105,124],"Generative":[106],"AI":[107],"is":[108,192],"an":[109,171,216],"genre":[112],"capable":[113],"creating":[115],"text,":[116],"images,":[117],"video":[118],"other":[120,158],"using":[122],"The":[125],"recent":[126],"explosion":[127],"interest":[129],"GenAI":[131,185],"was":[132],"heralded":[133],"by":[134,180],"invention":[136],"speedy":[138],"move":[139],"large":[143],"language":[144,155,160],"models":[145,149],"(LLM).":[146],"computational":[148],"are":[150,164],"able":[151],"achieve":[153],"general-purpose":[154],"generation":[156],"natural":[159],"processing":[161],"tasks":[162],"based":[165],"on":[166],"transformer":[167],"architectures,":[168],"which":[169],"made":[170],"evolutionary":[172],"leap":[173],"from":[174],"previous":[175],"neural":[176],"network":[177],"architectures.":[178],"Fuelled":[179],"advent":[182],"improved":[184],"techniques":[186],"wide":[188],"scale":[189],"usage,":[190],"this":[191,210],"surely":[193],"time":[195],"how":[198],"can":[201],"be":[202],"used":[203],"advance":[205],"infectious":[206,228],"disease":[207,229],"research.":[208,230],"In":[209],"commentary":[211],"aim":[213],"create":[215],"overview":[217],"position":[223]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
