{"id":"https://openalex.org/W7138446791","doi":"https://doi.org/10.48550/arxiv.2603.14473","title":"AI Can Learn Scientific Taste","display_name":"AI Can Learn Scientific Taste","publication_year":2026,"publication_date":"2026-03-15","ids":{"openalex":"https://openalex.org/W7138446791","doi":"https://doi.org/10.48550/arxiv.2603.14473"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.14473","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14473","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.14473","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113207942","display_name":"Jingqi Tong","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tong, Jingqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129723923","display_name":"Mingzhe Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Mingzhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129750790","display_name":"Hangcheng Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Hangcheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129741941","display_name":"Yongzhuo Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yongzhuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111122132","display_name":"Yurong Mou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mou, Yurong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129729588","display_name":"Weijie Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Weijie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123936692","display_name":"Zhiheng Xi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xi, Zhiheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129665754","display_name":"Hongji Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Hongji","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129729984","display_name":"Xiaoran Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiaoran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126955818","display_name":"Qinyuan Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Qinyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129715343","display_name":"Ming Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Ming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129668195","display_name":"Qiguang Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Qiguang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129729373","display_name":"Weifeng Ge","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ge, Weifeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129721342","display_name":"Qipeng Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Qipeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073076889","display_name":"Tianlei Ying","orcid":"https://orcid.org/0000-0002-9597-2843"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ying, Tianlei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126960455","display_name":"Tianxiang Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Tianxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129715659","display_name":"Yining Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Yining","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129727927","display_name":"Xinchi Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Xinchi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129747926","display_name":"Jun Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Jun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129724870","display_name":"Ning Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Ning","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129739902","display_name":"Xuanjing Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Xuanjing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129687371","display_name":"Yugang Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Yugang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129658175","display_name":"Xipeng Qiu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiu, Xipeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":23,"corresponding_author_ids":["https://openalex.org/A5113207942"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.4293999969959259,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.4293999969959259,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.05979999899864197,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.04600000008940697,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/judgement","display_name":"Judgement","score":0.7914000153541565},{"id":"https://openalex.org/keywords/taste","display_name":"Taste","score":0.7630000114440918},{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.7032999992370605},{"id":"https://openalex.org/keywords/sociology-of-scientific-knowledge","display_name":"Sociology of scientific knowledge","score":0.421999990940094},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3953000009059906},{"id":"https://openalex.org/keywords/scientific-evidence","display_name":"Scientific evidence","score":0.38199999928474426},{"id":"https://openalex.org/keywords/scientific-reasoning","display_name":"Scientific reasoning","score":0.36079999804496765}],"concepts":[{"id":"https://openalex.org/C2776548248","wikidata":"https://www.wikidata.org/wiki/Q12621536","display_name":"Judgement","level":2,"score":0.7914000153541565},{"id":"https://openalex.org/C8868529","wikidata":"https://www.wikidata.org/wiki/Q124794","display_name":"Taste","level":2,"score":0.7630000114440918},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.7032999992370605},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5009999871253967},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4253000020980835},{"id":"https://openalex.org/C195732255","wikidata":"https://www.wikidata.org/wiki/Q981008","display_name":"Sociology of scientific knowledge","level":2,"score":0.421999990940094},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.41749998927116394},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3953000009059906},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.3824999928474426},{"id":"https://openalex.org/C124056412","wikidata":"https://www.wikidata.org/wiki/Q3320364","display_name":"Scientific evidence","level":2,"score":0.38199999928474426},{"id":"https://openalex.org/C2992562121","wikidata":"https://www.wikidata.org/wiki/Q3817808","display_name":"Scientific reasoning","level":2,"score":0.36079999804496765},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.3571000099182129},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.35359999537467957},{"id":"https://openalex.org/C181204326","wikidata":"https://www.wikidata.org/wiki/Q7239820","display_name":"Preference learning","level":3,"score":0.3474999964237213},{"id":"https://openalex.org/C23213167","wikidata":"https://www.wikidata.org/wiki/Q2351730","display_name":"Scientific progress","level":2,"score":0.32910001277923584},{"id":"https://openalex.org/C2781083858","wikidata":"https://www.wikidata.org/wiki/Q17327049","display_name":"Scientific literature","level":2,"score":0.31439998745918274},{"id":"https://openalex.org/C138379479","wikidata":"https://www.wikidata.org/wiki/Q1116876","display_name":"Scientific modelling","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C2992915469","wikidata":"https://www.wikidata.org/wiki/Q2465832","display_name":"Scientific field","level":3,"score":0.263700008392334},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.26179999113082886}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.14473","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14473","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.14473","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14473","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Great":[0],"scientists":[1],"have":[2],"strong":[3],"judgement":[4],"and":[5,27,76,85,98,146,153],"foresight,":[6],"closely":[7],"tied":[8],"to":[9,20,22,25,106,126,148],"what":[10],"we":[11,16,58,91,119],"call":[12],"scientific":[13,51,78,175],"taste.":[14],"Here,":[15],"use":[17],"the":[18,23],"term":[19],"refer":[21],"capacity":[24],"judge":[26,107],"propose":[28,59,127],"research":[29,38,128,160],"ideas":[30,129,161],"with":[31,130,162],"high":[32,131],"potential":[33,132,164],"impact.":[34,133],"However,":[35],"most":[36],"relative":[37],"focuses":[39],"on":[40,95],"improving":[41],"an":[42,49],"AI":[43,172,184],"scientist's":[44],"executive":[45],"capability,":[46],"while":[47],"enhancing":[48],"AI's":[50],"taste":[52,79],"remains":[53],"underexplored.":[54],"In":[55],"this":[56],"work,":[57],"Reinforcement":[60],"Learning":[61],"from":[62],"Community":[63],"Feedback":[64],"(RLCF),":[65],"a":[66,82,116,121,178],"training":[67],"paradigm":[68],"that":[69,171],"uses":[70],"large-scale":[71],"community":[72],"signals":[73],"as":[74,81,115],"supervision,":[75],"formulate":[77],"learning":[80],"preference":[83,89,110],"modeling":[84],"alignment":[86],"problem.":[87],"For":[88,109],"modeling,":[90],"train":[92,120],"Scientific":[93,113,124,136,157],"Judge":[94,114,137],"700K":[96],"field-":[97],"time-matched":[99],"pairs":[100],"of":[101],"high-":[102],"vs.":[103],"low-citation":[104],"papers":[105],"ideas.":[108],"alignment,":[111],"using":[112],"reward":[117],"model,":[118,123],"policy":[122],"Thinker,":[125],"Experiments":[134],"show":[135,170],"outperforms":[138],"SOTA":[139],"LLMs":[140],"(e.g.,":[141],"GPT-5.2,":[142],"Gemini":[143],"3":[144],"Pro)":[145],"generalizes":[147],"future-year":[149],"test,":[150],"unseen":[151],"fields,":[152],"peer-review":[154],"preference.":[155],"Furthermore,":[156],"Thinker":[158],"proposes":[159],"higher":[163],"impact":[165],"than":[166],"baselines.":[167],"Our":[168],"findings":[169],"can":[173],"learn":[174],"taste,":[176],"marking":[177],"key":[179],"step":[180],"toward":[181],"reaching":[182],"human-level":[183],"scientists.":[185]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-18T00:00:00"}
