{"id":"https://openalex.org/W4394948556","doi":"https://doi.org/10.48550/arxiv.2404.11276","title":"Towards Data-Centric Automatic R&amp;D","display_name":"Towards Data-Centric Automatic R&amp;D","publication_year":2024,"publication_date":"2024-04-17","ids":{"openalex":"https://openalex.org/W4394948556","doi":"https://doi.org/10.48550/arxiv.2404.11276"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2404.11276","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.11276","pdf_url":"https://arxiv.org/pdf/2404.11276","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.11276","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5095777598","display_name":"Haotian Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Haotian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095777599","display_name":"Xinjie Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Xinjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095777600","display_name":"Zeqi Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Zeqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Feng, Wenjun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Wenjun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Wang, Haoxue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Haoxue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095777601","display_name":"Xiao Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Xiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095777602","display_name":"Xu Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095777603","display_name":"Weiqing Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Weiqing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5095777604","display_name":"Jiang Bian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bian, Jiang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5095777598"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.7731999754905701,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.7731999754905701,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11801","display_name":"Reservoir Engineering and Simulation Methods","score":0.7731999754905701,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.763700008392334,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.39027658104896545}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39027658104896545}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2404.11276","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.11276","pdf_url":"https://arxiv.org/pdf/2404.11276","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2404.11276","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2404.11276","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2404.11276","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.11276","pdf_url":"https://arxiv.org/pdf/2404.11276","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4394948556.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2530322880"],"abstract_inverted_index":{"The":[0,30],"progress":[1],"of":[2,56,64,140,217],"humanity":[3],"is":[4,83,153],"driven":[5],"by":[6,11,22,100],"those":[7],"successful":[8,71],"discoveries":[9,72],"accompanied":[10],"countless":[12],"failed":[13],"experiments.":[14,29],"Researchers":[15],"often":[16],"seek":[17],"the":[18,39,42,61,69,93,98,113,135,157,215,218],"potential":[19,70,177,219],"research":[20,78,168,172],"directions":[21],"reading":[23],"and":[24,66,79,137,144,170],"then":[25],"verifying":[26],"them":[27],"through":[28],"process":[31,82],"imposes":[32],"a":[33,53,77,102,121],"significant":[34,181],"burden":[35,63],"on":[36,133],"researchers.":[37],"In":[38,87],"past":[40],"decade,":[41],"data-driven":[43],"black-box":[44],"deep":[45],"learning":[46],"method":[47],"has":[48],"demonstrated":[49],"its":[50],"effectiveness":[51],"in":[52,115,146],"wide":[54],"range":[55],"real-world":[57],"scenarios,":[58],"which":[59],"exacerbates":[60],"experimental":[62],"researchers":[65],"thus":[67,213],"renders":[68],"veiled.":[73],"Therefore,":[74],"automating":[75],"such":[76],"development":[80,182],"(R&amp;D)":[81],"an":[84],"urgent":[85],"need.":[86],"this":[88],"paper,":[89],"we":[90],"serve":[91],"as":[92,120],"first":[94],"effort":[95],"to":[96,123,156,178,183,188,200,203,222],"formalize":[97],"goal":[99,129],"proposing":[101],"Real-world":[103],"Data-centric":[104],"automatic":[105,117,209],"R&amp;D":[106,118,210],"Benchmark,":[107],"namely":[108],"RD2Bench.":[109],"RD2Bench":[110,152],"benchmarks":[111],"all":[112],"operations":[114],"data-centric":[116],"(D-CARD)":[119],"whole":[122],"navigate":[124],"future":[125,201],"work":[126,202],"toward":[127],"our":[128],"directly.":[130],"We":[131,198],"focus":[132],"evaluating":[134],"interaction":[136],"synergistic":[138],"effects":[139],"various":[141],"model":[142,162],"capabilities":[143],"aiding":[145],"selecting":[147],"well-performing":[148],"trustworthy":[149],"models.":[150],"Although":[151],"very":[154],"challenging":[155],"state-of-the-art":[158],"(SOTA)":[159],"large":[160],"language":[161],"(LLM)":[163],"named":[164],"GPT-4,":[165],"indicating":[166],"ample":[167],"opportunities":[169,216],"more":[171,180],"efforts,":[173],"LLMs":[174],"possess":[175],"promising":[176],"bring":[179],"D-CARD:":[184],"They":[185],"are":[186],"able":[187],"implement":[189],"some":[190],"simple":[191],"methods":[192],"without":[193],"adopting":[194],"any":[195],"additional":[196],"techniques.":[197],"appeal":[199],"take":[204],"developing":[205],"techniques":[206],"for":[207],"tackling":[208],"into":[211],"consideration,":[212],"bringing":[214],"revolutionary":[220],"upgrade":[221],"human":[223],"productivity.":[224]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2024-04-19T00:00:00"}
